<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">779455</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2021.779455</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Identifying Potential miRNA Biomarkers for Gastric Cancer Diagnosis Using Machine Learning Variable Selection Approach</article-title>
<alt-title alt-title-type="left-running-head">Gilani et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">miRNAs as Gastric Cancer Biomarkers</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Gilani</surname>
<given-names>Neda</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1421961/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Arabi Belaghi</surname>
<given-names>Reza</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1361170/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Aftabi</surname>
<given-names>Younes</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1112385/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Faramarzi</surname>
<given-names>Elnaz</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/833467/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Edg&#xfc;nl&#xfc;</surname>
<given-names>Tuba</given-names>
</name>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Somi</surname>
<given-names>Mohammad Hossein</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Statistics and Epidemiology, Faculty of Health, Tabriz University of Medical Sciences</institution>, <addr-line>Tabriz</addr-line>, <country>Iran</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Mathematics, Uppsala University</institution>, <addr-line>Uppsala</addr-line>, <country>Sweden</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Statistics, Faculty of Mathematical Science, University of Tabriz</institution>, <addr-line>Tabriz</addr-line>, <country>Iran</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Tuberculosis and Lung Diseases Research Center, Tabriz University of Medical Sciences</institution>, <addr-line>Tabriz</addr-line>, <country>Iran</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Liver and Gastrointestinal Diseases Research Center, Tabriz University of Medical Sciences</institution>, <addr-line>Tabriz</addr-line>, <country>Iran</country>
</aff>
<aff id="aff6">
<sup>6</sup>
<institution>Department of Medical Biology, Faculty of Medicine, Mu&#x11f;la S&#x131;tk&#x131; Ko&#xe7;man University</institution>, <addr-line>Mu&#x11f;la</addr-line>, <country>Turkey</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/800132/overview">Tao Wang</ext-link>, Northwestern Polytechnical University, China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1503047/overview">Xiawei Li</ext-link>, Zhejiang University, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/782267/overview">Yanshuo Chu</ext-link>, University of Texas MD Anderson Cancer Center, United&#x20;States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Neda Gilani, <email>gilanin@tbzmed.ac.ir</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Statistical Genetics and Methodology, a section of the journal Frontiers in Genetics</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>10</day>
<month>01</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>12</volume>
<elocation-id>779455</elocation-id>
<history>
<date date-type="received">
<day>18</day>
<month>09</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>22</day>
<month>11</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Gilani, Arabi Belaghi, Aftabi, Faramarzi, Edg&#xfc;nl&#xfc; and Somi.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Gilani, Arabi Belaghi, Aftabi, Faramarzi, Edg&#xfc;nl&#xfc; and Somi</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<abstract>
<p>
<bold>Aim:</bold> This study aimed to accurately identification of potential miRNAs for gastric cancer (GC) diagnosis at the early stages of the disease.</p>
<p>
<bold>Methods:</bold> We used GSE106817 data with 2,566 miRNAs to train the machine learning models. We used the Boruta machine learning variable selection approach to identify the strong miRNAs associated with GC in the training sample. We then validated the prediction models in the independent sample GSE113486 data. Finally, an ontological analysis was done on identified miRNAs to eliciting the relevant relationships.</p>
<p>
<bold>Results:</bold> Of those 2,874 patients in the training the model, there were 115 (4%) patients with GC. Boruta identified 30 miRNAs as potential biomarkers for GC diagnosis and hsa-miR-1343-3p was at the highest ranking. All of the machine learning algorithms showed that using hsa-miR-1343-3p as a biomarker, GC can be predicted with very high precision (AUC; 100%, sensitivity; 100%, specificity; 100% ROC; 100%, Kappa; 100) using with the cut-off point of 8.2 for hsa-miR-1343-3p. Also, ontological analysis of 30 identified miRNAs approved their strong relationship with cancer associated genes and molecular events.</p>
<p>
<bold>Conclusion:</bold> The hsa-miR-1343-3p could be introduced as a valuable target for studies on the GC diagnosis using reliable biomarkers.</p>
</abstract>
<kwd-group>
<kwd>miRNA</kwd>
<kwd>machine learning</kwd>
<kwd>boruta algorithm</kwd>
<kwd>gastric cancer</kwd>
<kwd>hsa-miR-1343-3p</kwd>
<kwd>AUC</kwd>
<kwd>GSE106817</kwd>
<kwd>GSE113486</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>Gastric cancer (GC) is a significant global health issue due to being the fifth leading cancer worldwide as well as the third cancer-related death leading cause, which leads to nearly 8,00,000 deaths annually (<xref ref-type="bibr" rid="B4">Bray, 2018</xref>). Morbidity and mortality due to GC have reduced in recent years, though the rate of 5-year survival is still fairly low (<xref ref-type="bibr" rid="B27">Howlader, 2014</xref>). A significant prognostic factor is the stage of cancer at the diagnosis time. The 5-year survival of GC patients is below 30% if the disease is diagnosed at the advanced stages (<xref ref-type="bibr" rid="B28">Hundahl et&#x20;al., 2000</xref>), while the 5-year survival of patients ranges between 70 and 90% if diagnosed at the early stages (<xref ref-type="bibr" rid="B8">Choi, 2015</xref>). Thus, GC will remain among the toughest challenges for physicians and researchers for so long since GC is not symptomatic until the advanced stages; this is why effective screening approaches for the early detection of GC are mandatory to overcome GC mortalities (<xref ref-type="bibr" rid="B40">Penon et&#x20;al., 2014</xref>). Presently, gastroscopy is yet the standard test to diagnose GC (<xref ref-type="bibr" rid="B51">Veitch et&#x20;al., 2015</xref>). Nonetheless, this screening approach is invasive and costly. Furthermore, minimally invasive or non-invasive markers, including carcinoembryonic antigen (CEA) and carbohydrate antigen 19-9 (CA19-9) have been commonly used clinically, though these markers are neither specific nor sensitive enough for GC early diagnosis (<xref ref-type="bibr" rid="B6">Carpelan-Holmstr&#xf6;m et&#x20;al., 2002</xref>). Due to non-specific symptoms and the absence of an early diagnosis, a great number of patients with GC are diagnosed at the advanced stages (<xref ref-type="bibr" rid="B28">Hundahl et&#x20;al., 2000</xref>; <xref ref-type="bibr" rid="B24">Hartgrink et&#x20;al., 2009</xref>). Thus, cost-effective and non-invasive biomarkers are immediately required for the early diagnosis of&#x20;GC.</p>
<p>Recent genome analysis revealed several biomarkers which are related to RNA, DNA, exosome, et cetera. A class of endogenous non-coding RNAs is MicroRNAs (miRNAs) (nearly 22&#xa0;nt) which module the expression of the gene after transcription through degradation or translation blockage of target mRNAs (<xref ref-type="bibr" rid="B3">Bartel, 2004</xref>; <xref ref-type="bibr" rid="B5">Caldas and Brenton, 2005</xref>). It is well-known that cancer cells may release miRNAs via exosomes to enhance proliferation and migration (<xref ref-type="bibr" rid="B33">Li, 2018</xref>; <xref ref-type="bibr" rid="B58">Yoshimura, 2018</xref>; <xref ref-type="bibr" rid="B60">Zeng, 2018</xref>). The exosomal miRNAs released into biofluids, including serum, plasma, tear, urine, and gastric juice, may escape being degraded by RNases (<xref ref-type="bibr" rid="B19">Gilad, 2008</xref>). Moreover, miRNAs have been suggested as potential biomarkers which may be used to diagnose several types of cancers, including testicular germ cell tumors (using miRNA-371a-3p: specificity 94.0% and sensitivity 90.1%) (<xref ref-type="bibr" rid="B15">Dieckmann, 2019</xref>), bladder cancer (using 7-miRNA panel: specificity 87% and sensitivity 95%) (<xref ref-type="bibr" rid="B48">Usuba, 2019a</xref>), and hepatocellular carcinoma (using miR-424: specificity 87.13% and sensitivity 95.12%) (<xref ref-type="bibr" rid="B34">Lin, 2015</xref>), and lung cancer (<xref ref-type="bibr" rid="B1">Aftabi, 2021</xref>). Moreover, several studies reported that numerous miRNAs might be potentially used as biomarkers for GC diagnosis (<xref ref-type="bibr" rid="B64">Zhou, 2010</xref>; <xref ref-type="bibr" rid="B11">Cui, 2013</xref>; <xref ref-type="bibr" rid="B44">Su, 2014</xref>). Nonetheless, most of the miRNA biomarkers are not developed using comprehensive data mining according to miRNA profiling, and even they lack proper external efficacy validation (<xref ref-type="bibr" rid="B35">Link and Kupcinskas, 2018</xref>; <xref ref-type="bibr" rid="B52">Wei, 2019</xref>). Instead, recently, Artificial intelligence Technology (AT) usage in the field of microarray Data has attracted more attention. The disadvantage of the conventional statistical models, including logistic regression, was that they excluded the possible interaction terms and highly correlated variables; thus, they might lose a part of useful information, which might decrease their accuracy, specifically in the case of high dimensional miRNA data analysis (<xref ref-type="bibr" rid="B2">Alpaydin, 2020</xref>). Furthermore, the traditional models are not able to capture variables&#x2019; non-linear associations (<xref ref-type="bibr" rid="B29">James et&#x20;al., 2013</xref>; <xref ref-type="bibr" rid="B22">Gilani et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B21">Gilani et&#x20;al., 2019</xref>). Instead, Machine Learning (ML) is able to deal with non-linear structures as well as detecting all the possible interactions which may exist between predictors (<xref ref-type="bibr" rid="B20">Gilani et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B53">Wiemken and Kelley, 2020</xref>).</p>
<p>Machine learning has several algorithms of which the decision trees (DT), random forests (RF), extreme gradient boosted trees (XGBT), and artificial neural networks (ANN) that have been frequently applied in medicine (<xref ref-type="bibr" rid="B10">Cleophas and Zwinderman, 2015</xref>; <xref ref-type="bibr" rid="B14">Deo, 2015</xref>), particularly in prediction of cancer (<xref ref-type="bibr" rid="B13">DeGregory, 2018</xref>; <xref ref-type="bibr" rid="B16">Fakhari et&#x20;al., 2019</xref>). Random forest is a tree-based classification algorithm, and as the name indicates, the algorithm creates a forest with a huge number of trees. It is an ensemble algorithm that combines multiple algorithms. The random forest creates a set of decision trees from a random sample of the training set. It repeats the process with multiple random samples and makes a final decision based on majority voting (<xref ref-type="bibr" rid="B66">Zhou, 2012</xref>). Briefly, gradient boosted trees combine multiple classification trees into an additively weighted classifier. Boosting refers to the method where sequentially ascertained trees were trained, meaning each observation was weighted by its error obtained by minimizing the appropriate loss of function in the previous iteration. In this way, boosting is a gradient descent algorithm (<xref ref-type="bibr" rid="B9">Christensen and Bastien, 2016</xref>) and forces the classifier to focus on aspects of the data that are difficult to learn (<xref ref-type="bibr" rid="B25">Hastie et&#x20;al., 2009</xref>).</p>
<p>Artificial neural networks have been broadly used in medical studies (<xref ref-type="bibr" rid="B12">Darsey et&#x20;al., 2015</xref>; <xref ref-type="bibr" rid="B13">DeGregory, 2018</xref>; <xref ref-type="bibr" rid="B41">Shahid et&#x20;al., 2019</xref>). Such models perform satisfactorily, especially for classification problems with complex and non-linear associations between variables (<xref ref-type="bibr" rid="B25">Hastie et&#x20;al., 2009</xref>). Briefly, artificial neural networks are based on a collection of artificial neurons, which receive and process inputs (predictors), transmit them to other artificial neurons, and produce an output (<xref ref-type="bibr" rid="B66">Zhou, 2012</xref>).</p>
<p>Considering the important role of GC early diagnosis in patient&#x2019;s survival rate and the lack of published article on identifying potential miRNAs for GC prediction at an early stage by AT, the present study aims to identify the potential miRNA for predicting GC by AT in the datasets of Gene Expression Omnibus (GEO) specifically with the stat of the art machine learning models. Traditional statistical models such as linear models previously has been used in looking for GC biomarkers and identified miRNAs with the potential prediction power (<xref ref-type="bibr" rid="B56">Yao, 2020</xref>), however, they have not implemented advanced methods such as machine learning and new variable selection approaches such as Synthetic Minority <italic>Oversampling</italic> Technique (SMOTE). In the present study, for the first time, we aimed to use those new techniques for identification of GC related miRNAs with a reliable cut-of and highest possible accurecy in the external validation.</p>
</sec>
<sec sec-type="methods" id="s2">
<title>Methods</title>
<sec id="s2-1">
<title>The Applied Datasets</title>
<p>For training sample, we used GSE106817 dataset that is available at <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/geo/">https://www.ncbi.nlm.nih.gov/geo/</ext-link>. The dataset consist of the data of 2,566 miRNAs obtained from 2,759&#x20;non-cancer controls, and 115&#xa0;GC cases (4%). In the original study the serum samples of cancer cases and non-cancer controls have been analyzed by microarray for miRNA expression profiles (<xref ref-type="bibr" rid="B57">Yokoi, 2018</xref>). For test sample we used GSE113486 dataset, which includes data of miRNA expression profiles from the serum samples of 40&#xa0;GC cases (28.6%) and 100 normal controls (71.4%) (<xref ref-type="bibr" rid="B49">Usuba, 2019b</xref>). All the datasets were serum miRNA profiles based on the same microarray platform, 3D-Gene Huma miRNA V21_1.0.0 (39). The study was approved by the NCCH Institutional Review Board (2015-376, 2016-29) and the Research Ethics Committee of Medical Corporation Shintokai Yokohama Minoru Clinic (6019-18-3772). Written informed consent was obtained from each participant&#x20;(42). This study was approved by the Ethics Committee of Tabriz University of Medical Sciences (No: IR. TBZMED.REC.1400.006).</p>
</sec>
<sec id="s2-2">
<title>Boruta Machine Learning Algorithm</title>
<p>We used the Boruta machine learning algorithm to select the most critical miRNAs related to GC in the training sample that produce the highest prediction accuracy. In short, Boruta selects the variables that have a high impact on the prediction accuracy by providing the &#x201c;variable importance&#x201d; (<xref ref-type="bibr" rid="B32">Kursa and Rudnicki, 2018</xref>). We used SMOTE random oversampling to balance the outcome in the GSE106817 data. We then used five-fold cross-validation to find the optimal hyper parameters on DT, RF, LR, XGBT, and ANN to choose the best approaches in the balanced sample using the most important variables selected by Boruta. Once the prediction models were developed, we applied them on the test sample GSE113486 to verify the accuracy of developed prediction approach. We looked for an algorithm that may generate a higher predictive power among the 5&#xa0;ML algorithms in terms of the yielded areas under the ROC curves (AUCs). Sensitivity, specificity, positive predictive value, negative predictive value, misclassification rate, and Kappa were assessed. The guidelines of developing transparent multivariable prediction models was followed for these analysis (<xref ref-type="bibr" rid="B39">Moons, 2015</xref>).</p>
</sec>
<sec id="s2-3">
<title>GeneCodis Ontological Analysis</title>
<p>GeneCodis is a web-based tool for the ontological analysis of lists of genes, proteins, and regulatory elements like miRNAs, transcription factors, and CpGs. It can be used to determine biological annotations or combinations of annotations that are significantly associated to a list of genes under study with respect to a reference list. As well as single annotations, this tool allows users to simultaneously evaluate annotations from different sources, for example GO Biological Process and KEGG. To this end, and before computing <italic>p</italic>-values, it uses the apriori algorithm to extract sets of annotations that frequently co-occur in the analyzed list of genes (<xref ref-type="bibr" rid="B18">Garcia-Moreno, 2021</xref>). We used GeneCodis 4 (<ext-link ext-link-type="uri" xlink:href="https://genecodis.genyo.es/">https://genecodis.genyo.es/</ext-link>) for ontological analysis of the identified miRNAs&#x20;list.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<p>Of those 2,874 patients included in this study, there were 115 (4%) patients with gastric cancer. This analysis consists of 2,566 miRNAs.</p>
<sec id="s3-1">
<title>Selected miRNAs as Potential GC Biomarkers</title>
<p>Of those 2,566 miRNA in GSE106817 data, the Boruta algorithm initially selected 108 miRNA using Gini Index measurement (results are not shown here). The processing time was 17.24 minuts There were 77 tentative variables at the first stage. After fixing the tentative features, Boruta identified 156 miRNA for the analysis (results are not shown here). The process took 99 iterations convergence. It was observed that hsa-miR-1343-3p had the highest importance for prediction accurecy (minimum importance; 6.47, median importance; 11.44, mean importance; 10.81; maximum importance; 13.63) among all identified miRNAs. The hsa-miR-1290 and hsa-miR-5100 had the second and third highest importance, with mean importance of 8.69 and 8.66, respectively (<xref ref-type="table" rid="T1">Table&#x20;1</xref>).</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Selected important miRNAs by Boruta Algorithm Using XGboost Algorithm.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">No</th>
<th align="center">miRNA</th>
<th align="center">Importance</th>
<th align="center">Se (%)</th>
<th align="center">Sp (%)</th>
<th align="center">PPV (%)</th>
<th align="center">NPV (%)</th>
<th align="center">AUC (%)</th>
<th align="center">Accuracy (%)</th>
<th align="center">Kappa (%)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">1</td>
<td align="left">hsa-miR-1343-3p</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">1.00</td>
</tr>
<tr>
<td align="center">2</td>
<td align="left">hsa-miR-1290</td>
<td align="char" char=".">80.39</td>
<td align="char" char=".">92.50</td>
<td align="char" char=".">98.00</td>
<td align="char" char=".">94.87</td>
<td align="char" char=".">97.03</td>
<td align="char" char=".">99.05</td>
<td align="char" char=".">96.43</td>
<td align="char" char=".">0.96</td>
</tr>
<tr>
<td align="center">3</td>
<td align="left">hsa-miR-5100</td>
<td align="char" char=".">80.11</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">99.00</td>
<td align="char" char=".">97.56</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">99.23</td>
<td align="char" char=".">99.29</td>
<td align="char" char=".">0.99</td>
</tr>
<tr>
<td align="center">4</td>
<td align="left">hsa-miR-6746-5p</td>
<td align="char" char=".">64.57</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">93.00</td>
<td align="char" char=".">85.11</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">97.23</td>
<td align="char" char=".">95.00</td>
<td align="char" char=".">0.95</td>
</tr>
<tr>
<td align="center">5</td>
<td align="left">hsa-miR-4532</td>
<td align="char" char=".">64.85</td>
<td align="char" char=".">67.50</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">88.50</td>
<td align="char" char=".">95.11</td>
<td align="char" char=".">90.71</td>
<td align="char" char=".">0.91</td>
</tr>
<tr>
<td align="center">6</td>
<td align="left">hsa-miR-8073</td>
<td align="char" char=".">61.79</td>
<td align="char" char=".">97.50</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">99.01</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">99.29</td>
<td align="char" char=".">0.99</td>
</tr>
<tr>
<td align="center">7</td>
<td align="left">hsa-miR-1228-5p</td>
<td align="char" char=".">56.24</td>
<td align="char" char=".">97.50</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">99.01</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">99.29</td>
<td align="char" char=".">0.99</td>
</tr>
<tr>
<td align="center">8</td>
<td align="left">hsa-miR-1199-5p</td>
<td align="char" char=".">54.12</td>
<td align="char" char=".">62.50</td>
<td align="char" char=".">97.00</td>
<td align="char" char=".">89.29</td>
<td align="char" char=".">86.61</td>
<td align="char" char=".">92.56</td>
<td align="char" char=".">87.14</td>
<td align="char" char=".">0.87</td>
</tr>
<tr>
<td align="center">9</td>
<td align="left">hsa-miR-3622a-5p</td>
<td align="char" char=".">54.49</td>
<td align="char" char=".">80.00</td>
<td align="char" char=".">99.00</td>
<td align="char" char=".">96.97</td>
<td align="char" char=".">92.52</td>
<td align="char" char=".">97.26</td>
<td align="char" char=".">93.57</td>
<td align="char" char=".">0.94</td>
</tr>
<tr>
<td align="center">10</td>
<td align="left">hsa-miR-8060</td>
<td align="char" char=".">53.75</td>
<td align="char" char=".">85.00</td>
<td align="char" char=".">98.00</td>
<td align="char" char=".">94.44</td>
<td align="char" char=".">94.23</td>
<td align="char" char=".">98.79</td>
<td align="char" char=".">94.29</td>
<td align="char" char=".">0.94</td>
</tr>
<tr>
<td align="center">11</td>
<td align="left">hsa-miR-1246</td>
<td align="char" char=".">50.42</td>
<td align="char" char=".">92.50</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">97.09</td>
<td align="char" char=".">99.90</td>
<td align="char" char=".">97.86</td>
<td align="char" char=".">0.98</td>
</tr>
<tr>
<td align="center">12</td>
<td align="left">hsa-miR-4787-3p</td>
<td align="char" char=".">50.32</td>
<td align="char" char=".">90.00</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">96.15</td>
<td align="char" char=".">98.75</td>
<td align="char" char=".">97.14</td>
<td align="char" char=".">0.97</td>
</tr>
<tr>
<td align="center">13</td>
<td align="left">hsa-miR-6087</td>
<td align="char" char=".">49.68</td>
<td align="char" char=".">22.50</td>
<td align="char" char=".">88.00</td>
<td align="char" char=".">42.86</td>
<td align="char" char=".">73.95</td>
<td align="char" char=".">62.70</td>
<td align="char" char=".">69.29</td>
<td align="char" char=".">0.69</td>
</tr>
<tr>
<td align="center">14</td>
<td align="left">hsa-miR-4259</td>
<td align="char" char=".">47.55</td>
<td align="char" char=".">90.00</td>
<td align="char" char=".">98.00</td>
<td align="char" char=".">94.74</td>
<td align="char" char=".">96.08</td>
<td align="char" char=".">99.04</td>
<td align="char" char=".">95.71</td>
<td align="char" char=".">0.96</td>
</tr>
<tr>
<td align="center">15</td>
<td align="left">hsa-miR-6877-5p</td>
<td align="char" char=".">46.90</td>
<td align="char" char=".">92.50</td>
<td align="char" char=".">94.00</td>
<td align="char" char=".">86.05</td>
<td align="char" char=".">96.91</td>
<td align="char" char=".">97.73</td>
<td align="char" char=".">93.57</td>
<td align="char" char=".">0.94</td>
</tr>
<tr>
<td align="center">16</td>
<td align="left">hsa-miR-124-3p</td>
<td align="char" char=".">45.42</td>
<td align="char" char=".">92.50</td>
<td align="char" char=".">94.00</td>
<td align="char" char=".">86.05</td>
<td align="char" char=".">96.91</td>
<td align="char" char=".">96.81</td>
<td align="char" char=".">93.57</td>
<td align="char" char=".">0.94</td>
</tr>
<tr>
<td align="center">17</td>
<td align="left">hsa-miR-6787-5p</td>
<td align="char" char=".">45.14</td>
<td align="char" char=".">87.50</td>
<td align="char" char=".">99.00</td>
<td align="char" char=".">97.22</td>
<td align="char" char=".">95.19</td>
<td align="char" char=".">99.70</td>
<td align="char" char=".">95.71</td>
<td align="char" char=".">0.96</td>
</tr>
<tr>
<td align="center">18</td>
<td align="left">hsa-miR-4454</td>
<td align="char" char=".">45.05</td>
<td align="char" char=".">95.00</td>
<td align="char" char=".">98.00</td>
<td align="char" char=".">95.00</td>
<td align="char" char=".">98.00</td>
<td align="char" char=".">98.10</td>
<td align="char" char=".">97.14</td>
<td align="char" char=".">0.97</td>
</tr>
<tr>
<td align="center">19</td>
<td align="left">hsa-miR-6760-5p</td>
<td align="char" char=".">45.42</td>
<td align="char" char=".">90.00</td>
<td align="char" char=".">94.00</td>
<td align="char" char=".">85.71</td>
<td align="char" char=".">95.92</td>
<td align="char" char=".">98.58</td>
<td align="char" char=".">92.86</td>
<td align="char" char=".">0.93</td>
</tr>
<tr>
<td align="center">20</td>
<td align="left">hsa-miR-668-5p</td>
<td align="char" char=".">45.24</td>
<td align="char" char=".">77.50</td>
<td align="char" char=".">98.00</td>
<td align="char" char=".">93.94</td>
<td align="char" char=".">91.59</td>
<td align="char" char=".">96.44</td>
<td align="char" char=".">92.14</td>
<td align="char" char=".">0.92</td>
</tr>
<tr>
<td align="center">21</td>
<td align="left">hsa-miR-6762-5p</td>
<td align="char" char=".">42.09</td>
<td align="char" char=".">45.00</td>
<td align="char" char=".">92.00</td>
<td align="char" char=".">69.23</td>
<td align="char" char=".">80.70</td>
<td align="char" char=".">88.94</td>
<td align="char" char=".">78.57</td>
<td align="char" char=".">0.79</td>
</tr>
<tr>
<td align="center">22</td>
<td align="left">hsa-miR-3191-3p</td>
<td align="char" char=".">40.43</td>
<td align="char" char=".">75.00</td>
<td align="char" char=".">94.00</td>
<td align="char" char=".">83.33</td>
<td align="char" char=".">90.38</td>
<td align="char" char=".">93.48</td>
<td align="char" char=".">88.57</td>
<td align="char" char=".">0.89</td>
</tr>
<tr>
<td align="center">23</td>
<td align="left">hsa-miR-1268b</td>
<td align="char" char=".">39.32</td>
<td align="char" char=".">70.00</td>
<td align="char" char=".">94.00</td>
<td align="char" char=".">82.35</td>
<td align="char" char=".">88.68</td>
<td align="char" char=".">93.91</td>
<td align="char" char=".">87.14</td>
<td align="char" char=".">0.87</td>
</tr>
<tr>
<td align="center">24</td>
<td align="left">hsa-miR-1185-2-3p</td>
<td align="char" char=".">39.13</td>
<td align="char" char=".">30.00</td>
<td align="char" char=".">87.00</td>
<td align="char" char=".">48.00</td>
<td align="char" char=".">75.65</td>
<td align="char" char=".">53.88</td>
<td align="char" char=".">70.71</td>
<td align="char" char=".">0.71</td>
</tr>
<tr>
<td align="center">25</td>
<td align="left">hsa-miR-6131</td>
<td align="char" char=".">38.30</td>
<td align="char" char=".">87.50</td>
<td align="char" char=".">98.00</td>
<td align="char" char=".">94.59</td>
<td align="char" char=".">95.15</td>
<td align="char" char=".">99.21</td>
<td align="char" char=".">95.00</td>
<td align="char" char=".">0.95</td>
</tr>
<tr>
<td align="center">26</td>
<td align="left">hsa-miR-920</td>
<td align="char" char=".">38.39</td>
<td align="char" char=".">87.50</td>
<td align="char" char=".">96.00</td>
<td align="char" char=".">89.74</td>
<td align="char" char=".">95.05</td>
<td align="char" char=".">98.26</td>
<td align="char" char=".">93.57</td>
<td align="char" char=".">0.94</td>
</tr>
<tr>
<td align="center">27</td>
<td align="left">hsa-miR-4635</td>
<td align="char" char=".">38.02</td>
<td align="char" char=".">77.50</td>
<td align="char" char=".">98.00</td>
<td align="char" char=".">93.94</td>
<td align="char" char=".">91.59</td>
<td align="char" char=".">95.38</td>
<td align="char" char=".">92.14</td>
<td align="char" char=".">0.92</td>
</tr>
<tr>
<td align="center">28</td>
<td align="left">hsa-miR-6724-5p</td>
<td align="char" char=".">37.28</td>
<td align="char" char=".">45.00</td>
<td align="char" char=".">81.00</td>
<td align="char" char=".">48.65</td>
<td align="char" char=".">78.64</td>
<td align="char" char=".">74.35</td>
<td align="char" char=".">70.71</td>
<td align="char" char=".">0.71</td>
</tr>
<tr>
<td align="center">29</td>
<td align="left">hsa-miR-1185-1-3p</td>
<td align="char" char=".">37.19</td>
<td align="char" char=".">20.00</td>
<td align="char" char=".">85.00</td>
<td align="char" char=".">34.78</td>
<td align="char" char=".">72.65</td>
<td align="char" char=".">54.70</td>
<td align="char" char=".">66.43</td>
<td align="char" char=".">0.66</td>
</tr>
<tr>
<td align="center">30</td>
<td align="left">hsa-miR-422a</td>
<td align="char" char=".">38.02</td>
<td align="char" char=".">55.00</td>
<td align="char" char=".">87.00</td>
<td align="char" char=".">62.86</td>
<td align="char" char=".">82.86</td>
<td align="char" char=".">72.94</td>
<td align="char" char=".">77.86</td>
<td align="char" char=".">0.78</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The balanced training data using SMOTE random oversampling technique had 1,376 cancer cases and 1,498&#x20;non-cancer controls. We trained DT, RF, LR, XGBT, and ANN perdition models with the selected miRNAs in the balanced training&#x20;data.</p>
</sec>
<sec id="s3-2">
<title>Prediction Models and Accuracy in the Validation Data</title>
<p>The external validation data GSE113486 had 40 (28.6%) gastric cancer and 100 (71.4%) non-cancer (controls). hsa-miR-1343-3 produced the highest prediction accuracy for GC prediction (<xref ref-type="table" rid="T1">Table&#x20;1</xref>). For the hsa-miR-1343-3, all of the accuracy measures including AUC, sensitivity and specificity, positive predictive value, negative predictive value, Kappa were 100%. According to the decision trees, the cut-off point for this miRNA was 8.2 (<xref ref-type="fig" rid="F1">Figure&#x20;1</xref>). Further, hsa-miR-8073 and hsa-miR-1228-5p produced 100% AUC but other accuracy measures were not 100%. On the other hsa-miR-1185-1-3p had the lowest AUC which has the least contribution to the prediction of&#x20;GC.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Boxplot of the selected miRNA from Boruta Algorithm. <bold>(A)</bold>, hsa-miR-1228-5p; <bold>(B)</bold>, hsa-miR-8073; <bold>(C)</bold>, hsa-miR-6746-5p; <bold>(D)</bold>, hsa-miR-5100; <bold>(E)</bold>, hsa-miR-4532; <bold>(F)</bold>: hsa-miR-1343-3p; <bold>(G)</bold>, hsa-miR-1290.</p>
</caption>
<graphic xlink:href="fgene-12-779455-g001.tif"/>
</fig>
<p>Among several models discussed in the study, the XGBT algorithm had better prediction accuracy overall (Table S1-S4). However, for hsa-miR-1343-3 all models had consistently 100% accuracy which indicates that this miRNA may strongly predict GC. For some miRNA such as hsa-miR-422a XGBT algorithm could predict GC with higher accuracy than the logistic regression and decision trees. <xref ref-type="fig" rid="F2">Figure&#x20;2</xref> shows the correlation of the important miRNAs. It can be observed that most of the identified miRNAs except hsa-miR-422a, hsa-miR-1185-1-3p, hsa-miR-1185-2-3p, hsa-miR-6087, and hsa-miR-1199-5p are highly correlated. Consequently, clustering of correlated those miRNAs is helpful for the identification of cancerous and non-cancerous patients. Finally, Heatmap plot indicates the result of the hierarchical clustering analysis of the 30 selected miRNAs, which represents that identified miRNAs can easily distinguish GC cases and controls in test sample obtained from GSE113486 dataset (<xref ref-type="fig" rid="F3">Figure&#x20;3</xref>).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Correlation plot of the selected miRNAs. Dark blue and dark red shows the strength of the correlations between miRNAs.</p>
</caption>
<graphic xlink:href="fgene-12-779455-g002.tif"/>
</fig>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Heathmap plot of clustering of 30 selected miRNAs.</p>
</caption>
<graphic xlink:href="fgene-12-779455-g003.tif"/>
</fig>
</sec>
<sec id="s3-3">
<title>Ontological Analysis</title>
<p>Regulatory, functional, and perturbation analysis by GeneCodis 4 showed that 30 identified miRNAs (<xref ref-type="table" rid="T1">Table&#x20;1</xref>) are related strongly to the cancer-associated genes and molecular events (<xref ref-type="fig" rid="F4">Figure&#x20;4</xref>). Visualizations generated for 10 top terms of associations with Transcription Factors (<xref ref-type="fig" rid="F4">Figure&#x20;4A</xref>), co-annotation of HMDD v3 (the Human microRNA disease database), MNDR (Mammalian ncRNA-Disease Repository), and TAM2 (The tool for annotations of human miRNAs) databases (<xref ref-type="fig" rid="F4">Figure&#x20;4B</xref>), GO (Gene Ontology and GO Annotations) Biological Process (<xref ref-type="fig" rid="F4">Figure&#x20;4C</xref>), GO Molecular Function (<xref ref-type="fig" rid="F4">Figure&#x20;4D</xref>), co-annotation of KEGG (Kyoto Encyclopedia of Genes and Genomes) Pathways, Panther (Protein ANalysis THrough Evolutionary Relationships) Pathways, and WikiPathways (<xref ref-type="fig" rid="F4">Figure&#x20;4E</xref>), and co-annotation of HPO (The Human Phenotype Ontology) and OMIM (Online Mendelian Inheritance in Man) databases (<xref ref-type="fig" rid="F4">Figure&#x20;4F</xref>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>GeneCodis Ontological analysis. Visualizations generated for 10 top terms of related categories with our identified miRNAs list are presented here for Transcription Factors <bold>(A)</bold>, Co-annotation of miRNAs-based analysis using HMDD v3, MNDR, and TAM2&#x20;<bold>(B)</bold>, GO Biological Process <bold>(C)</bold>, GO Molecular Function <bold>(D)</bold>, Co-annotation of KEGG Pathways, Panther Pathways, and WikiPathways databases <bold>(E)</bold>, and Co-annotation of HPO and OMIM databases <bold>(F)</bold>.</p>
</caption>
<graphic xlink:href="fgene-12-779455-g004.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>Using artificial intelligence technology, we identified hsa-miR-1343-3 as a very strong nominate for biomarker analysis of GC diagnosis. The value of hsa-miR-1343-3 higher than 8.2 indicates that it could be a strong predictor for GC (100% of AUC, 100% of Sensitivity and Sepecificity). We also found three other miRNAs (hsa-miR-8073 and hsa-miR-1228-5p) with a great contribution to the GC prediction. A medical expert can use these findings for the early detection of GC instead of using costly and time-consuming tools such as colonoscopy Yao et <italic>al.</italic> (<xref ref-type="bibr" rid="B56">Yao, 2020</xref>).</p>
<p>This study had several strengths compared to the previous studies. Compared to Shi et&#x20;al. that identified the miR-1246 as the potential biomarker of GC that generated the AUC of 83%, our study identified the hsa-miR-1343-3p using the Boruta algorithm that led to a significant increase in the AUC (<xref ref-type="bibr" rid="B42">Shi and Zhang, 2019</xref>). The study of Yao et&#x20;al., selected three miRNAs that produced similar precision to our study that using only single miRNA that may have economical merits. Further, their study used a limited sample size (70 gastric cancer patients and 374&#x20;non-cancer controls) in the training set that may lead to an inferior model. The current study used very advanced variable selection methods and the state of the art machine learning approaches that produced consistent results. Another merit of the study is introducing a simple cut-off point of 8.2 using decision trees that may has very practical value in GC classification.</p>
<p>
<xref ref-type="fig" rid="F4">Figure&#x20;4A</xref> depicted that among the transcription factors related to the genes associated with the identified miRNAs list (<xref ref-type="table" rid="T1">Table&#x20;1</xref>) the SP1, MYC, and E2F1 have higher priorities. SP1 protein expression is up regulated in GC tissues compared with normal tissues and is positively associated with depth of invasion and TNM stage of GC (<xref ref-type="bibr" rid="B42">Shi and Zhang, 2019</xref>). MYC is an oncogene responsible for excessive cell growth in cancer, enabling transcriptional activation of genes involved in cell cycle regulation, metabolism, and apoptosis, and is usually overexpressed in GC (<xref ref-type="bibr" rid="B38">Mau&#xe9;s, 2018</xref>). E2F1 is a member of the E2F family that functions in cell cycle progression and apoptosis induction in response to DNA damage. Deregulated E2F1 acts as a driving force in GC progression and promotes tumor invasion and metastasis independently from its other cellular activities (<xref ref-type="bibr" rid="B55">Yan, 2014</xref>).</p>
<p>As depicted in <xref ref-type="fig" rid="F4">Figure&#x20;4B</xref> gastrointestinal cancers including hepatocellular cancer, colon cancer, biliary tract cancer, and especially early-stage GC are among the most related diseases to the analyzed miRNAs list. From biological process and molecular function perspectives as showed in <xref ref-type="fig" rid="F4">Figures 4C,D</xref>, the regulation of transcription and gene expression, and protein and DNA binding are the most targeted aspects, which are the general aspects of molecular biology of GC (<xref ref-type="bibr" rid="B7">Cervantes et&#x20;al., 2007</xref>; <xref ref-type="bibr" rid="B50">Vauhkonen et&#x20;al., 2006</xref>; <xref ref-type="bibr" rid="B46">Tan and Yeoh, 2015</xref>). Co-annotation of three pathway databases (<xref ref-type="fig" rid="F4">Figure&#x20;4E</xref>) has shown that the miRNAs list is general in relation with pathways in cancer, VEGFA-VEGFR2 signaling pathway and PI3K-Akt signaling pathway. The increased expression of VEGFA in the tubular glands and VEGFR2 in the endothelium of GC samples mainly in the T2, T3 and T4 stages of tumor progression has been reported previously (<xref ref-type="bibr" rid="B45">Tamma, 2018</xref>). Also, it is showed that the PI3K/AKT/mTOR pathway is activated in GC with overexpression in tumor tissue, which is correlated with the depth of tumor infiltration and the presence of lymph node metastases (<xref ref-type="bibr" rid="B47">Tapia, 2014</xref>). Surprisingly, relation with Human cytomegalovirus infection, which was identified in our pathway analysis, has been reported to be associated with the development of GC (<xref ref-type="bibr" rid="B30">Jin, 2014</xref>) and GC lymphatic metastasis (<xref ref-type="bibr" rid="B63">Zhang, 2017</xref>).</p>
<p>The analysis of human phenotype and Mendelian inheritance ontologies identified Autosomal dominant inheritance and Global developmental delay among the most related phenomena with our miRNAs list. It is reported that gastric adenocarcinoma and proximal polyposis of the stomach is an autosomal dominant syndrome (<xref ref-type="bibr" rid="B54">Worthley, 2012</xref>). Also, some common variants have been described for GC and developmental delay (<xref ref-type="bibr" rid="B23">Hansford, 2015</xref>; <xref ref-type="bibr" rid="B61">Zhang, 2020</xref>).</p>
<p>In our study, we have shown theoreticaly that ther is a strong relationship between hsa-miR-1343-3p and GC. Hsa-miR-1343-3p has been indicated as a tumor suppressor for many types of cancer. It has been suggested that miR-1343-3p, which regulates the oncogenic effect of TEA domain transcription factors is associated with GC (<xref ref-type="bibr" rid="B65">Zhou, 2017</xref>). The correlation between hsa-miR-1343-3p and lung adenocarcinoma was evaluated and its expression was found to be low in patients with vascular invasion (<xref ref-type="bibr" rid="B31">Kim, 2017</xref>). Yuan et&#x20;al. demonstrated that hsa-miR-1343-3p is consistently down-regulated in colon, prostate, and pancreatic cancers. Also, hsa-miR-1343-3p has been proposed as a biomarker to distinguish pancreato-biliary malignancy from non-malignant diseases. The major genes targeted by miR-1343-3p have been identified (<xref ref-type="bibr" rid="B59">Yuan, 2016</xref>). In this context, these target genes and their interaction with GC should also be investigated. The hsa-miR-1343-3p targets including SHISA7, TGFBR1, DLGAP3, SPRED1, ATXN7L3, and PLXDC2 genes are listed at MIRDB (<ext-link ext-link-type="uri" xlink:href="http://mirdb.org/">http://mirdb.org/</ext-link>). Among them transforming growth factor beta-1 (TGF&#x3b2;1) play an important role in carcinogenesis upon binding its receptor (TGFBR1). It acts as a tumor suppressor by inhibiting cellular proliferation or by promoting cellular differentiation and apoptosis. However, it turns to be a tumor promoter by stimulating angiogenesis and cell motility, suppressing the immune response, and increasing progressive invasion and metastasis (<xref ref-type="bibr" rid="B59">Yuan, 2016</xref>). Other reports have also revealed that hsa-miR-1343-3p reduces the expression of transforming growth factor-&#x3b2; (TGF-&#x3b2;) receptor-1, which induces angiogenesis through vascular endothelial growth factor (VEGF)-mediated apoptosis. Therefore, hsa-miR-1343-3p may also play an anti-angiogenic role (<xref ref-type="bibr" rid="B17">Ferrari et&#x20;al., 2009</xref>; <xref ref-type="bibr" rid="B43">Stolzenburg et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B31">Kim, 2017</xref>). He et&#x20;al. determined that TGFBR1 genes&#x2019; two polymorphisms (rs334348, rs10512263) were associated with the risk of GC (<xref ref-type="bibr" rid="B26">He, 2018</xref>). In another study, Zhang et&#x20;al. have shown that silencing of TGFBR1 inhibited cell proliferation, migration, invasion, and EMT in GC&#xa0;cells (<xref ref-type="bibr" rid="B62">Zhang, 2019</xref>).</p>
<p>Discs large associated proteins (DLGAPs) family has been implicated in psychological and neurological diseases. However, few studies have explored the association between the expression of DLGAPs and different types of cancer. Liu et&#x20;al. has suggested that the significant overexpression of DLGAP4 in GC may be a promising potential prognostic marker for GC (<xref ref-type="bibr" rid="B36">Liu et&#x20;al., 2018</xref>). Aslo, Liu et&#x20;al. have determined decreased expression of SPRED1 in GC tissues (<xref ref-type="bibr" rid="B37">Liu et&#x20;al., 2020</xref>).</p>
<p>However, there were certain limitations in our study. We had relatively small sample size in GC group. Other limitations were the pathological information such as the tumor stage, age or other factors which were not available in our datasets. Nonetheless, the prediction accuracy of our model has high enough (100% AUC) for clinical use. Further, we were unable to do the survival analysis to further validate the markers identified in this paper based on public available data (<xref ref-type="bibr" rid="B27">Howlader, 2014</xref>).</p>
</sec>
<sec sec-type="conclusion" id="s5">
<title>Conclusion</title>
<p>Using several state of the art machine learning methods and Boruta algorithm, we identified several miRNAs that can predict GC. Specifically, hsa-miR-1343-3p, which identified by cut-off point of 8.2 may be nominated as a highly reliable biomarker for, GC diagnosis after meticulous empirical&#x20;tests.</p>
</sec>
</body>
<back>
<sec id="s6">
<title>Data Availability Statement</title>
<p>Publicly available datasets were analyzed in this study. This data can be found here: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/geo/">https://www.ncbi.nlm.nih.gov/geo/</ext-link>.</p>
</sec>
<sec id="s7">
<title>Author Contributions</title>
<p>NG and RB conducted this study and performed statistical analysis and machine learning models. YA and TE provided ontological analysis. The paper was reviewed by EF and MS before final submission.</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ack>
<p>We would like to thank the Associate Editor and three anonymous expert reviewers who significantly helped to improve the presentation of the&#x20;paper.</p>
</ack>
<sec id="s10">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2021.779455/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2021.779455/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table1.DOCX" id="SM1" mimetype="application/DOCX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Aftabi</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Long Non&#x2010;coding RNAs as Potential Biomarkers in the Prognosis and Diagnosis of Lung Cancer: A Review and Target Analysis</article-title>. <volume>73</volume>, <fpage>307</fpage>&#x2013;<lpage>327</lpage>. <pub-id pub-id-type="doi">10.1002/iub.2430</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Alpaydin</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2020</year>). <source>Introduction to Machine Learning</source>. <publisher-name>MIT press</publisher-name>. </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bartel</surname>
<given-names>D. P.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>MicroRNAs: Genomics, Biogenesis, Mechanism, and Function</article-title>. <source>cell</source> <volume>116</volume>, <fpage>281</fpage>&#x2013;<lpage>297</lpage>. <pub-id pub-id-type="doi">10.1016/s0092-8674(04)00045-5</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bray</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Global Cancer Statistics 2018: GLOBOCAN Estimates of Incidence and Mortality Worldwide for 36 Cancers in 185 Countries</article-title>. <source>CA: a Cancer J.&#x20;clinicians</source> <volume>68</volume>, <fpage>394</fpage>&#x2013;<lpage>424</lpage>. <pub-id pub-id-type="doi">10.3322/caac.21492</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Caldas</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Brenton</surname>
<given-names>J.&#x20;D.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Sizing up miRNAs as Cancer Genes</article-title>. <source>Nat. Med.</source> <volume>11</volume>, <fpage>712</fpage>&#x2013;<lpage>714</lpage>. <pub-id pub-id-type="doi">10.1038/nm0705-712</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carpelan-Holmstr&#xf6;m</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Louhimo</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Stenman</surname>
<given-names>U.-H.</given-names>
</name>
<name>
<surname>Alfthan</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Haglund</surname>
<given-names>C. C. E. A.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>CA 19-9 and CA 72-4 Improve the Diagnostic Accuracy in Gastrointestinal Cancers</article-title>. <source>Anticancer Res.</source> <volume>22</volume>, <fpage>2311</fpage>&#x2013;<lpage>2316</lpage>. </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cervantes</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Braun</surname>
<given-names>E. R.</given-names>
</name>
<name>
<surname>Fidalgo</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Gonz&#xe1;lez</surname>
<given-names>I. C. J.&#x20;C.</given-names>
</name>
<name>
<surname>Oncology</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2007</year>). <source>Mol. Biol. gastric Cancer</source> <volume>9</volume>, <fpage>208</fpage>&#x2013;<lpage>215</lpage>. <pub-id pub-id-type="doi">10.1007/s12094-007-0041-4</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Choi</surname>
<given-names>I. J.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Long-term Outcome Comparison of Endoscopic Resection and Surgery in Early Gastric Cancer Meeting the Absolute Indication for Endoscopic Resection</article-title>. <source>Gastrointest. Endosc.</source> <volume>81</volume>, <fpage>333</fpage>&#x2013;<lpage>341</lpage>. <pub-id pub-id-type="doi">10.1016/j.gie.2014.07.047</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Christensen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Bastien</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Introduction to General Optimization Principles and Methods</article-title>. <source>Nonlinear Optimization Vehicle Saf. Structures</source>, <fpage>107</fpage>&#x2013;<lpage>168</lpage>. <pub-id pub-id-type="doi">10.1016/b978-0-12-417297-5.00003-1</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Cleophas</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Zwinderman</surname>
<given-names>A. H.</given-names>
</name>
</person-group> (<year>2015</year>). <source>Machine Learning in Medicine-A Complete Overview</source>. <publisher-name>Springer</publisher-name>. </citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cui</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Gastric Juice MicroRNAs as Potential Biomarkers for the Screening of Gastric Cancer</article-title>. <source>Cancer</source> <volume>119</volume>, <fpage>1618</fpage>&#x2013;<lpage>1626</lpage>. <pub-id pub-id-type="doi">10.1002/cncr.27903</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Darsey</surname>
<given-names>J.&#x20;A.</given-names>
</name>
<name>
<surname>Griffin</surname>
<given-names>W. O.</given-names>
</name>
<name>
<surname>Joginipelli</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Melapu</surname>
<given-names>V. K.</given-names>
</name>
</person-group> (<year>2015</year>). <source>Artificial Neural Networks 269-283</source>. <publisher-name>Springer</publisher-name>. </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>DeGregory</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>A Review of Machine Learning in Obesity</article-title>. <source>Obes. Rev.</source> <volume>19</volume>, <fpage>668</fpage>&#x2013;<lpage>685</lpage>. <pub-id pub-id-type="doi">10.1111/obr.12667</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Deo</surname>
<given-names>R. C.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Machine Learning in Medicine</article-title>. <source>Circulation</source> <volume>132</volume>, <fpage>1920</fpage>&#x2013;<lpage>1930</lpage>. <pub-id pub-id-type="doi">10.1161/circulationaha.115.001593</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dieckmann</surname>
<given-names>K.-P.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Serum Levels of microRNA-371a-3p (M371 Test) as a New Biomarker of Testicular Germ Cell Tumors: Results of a Prospective Multicentric Study</article-title>. <source>J.&#x20;Clin. Oncol.</source> <volume>37</volume>, <fpage>1412</fpage>. <pub-id pub-id-type="doi">10.1200/jco.18.01480</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fakhari</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Gharepapagh</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Dabiri</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Gilani</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Correlation of Cancer Antigen 15-3 (CA15-3) Serum Level and Bony Metastases in Breast Cancer Patients</article-title>. <source>Med. J.&#x20;Islamic Republic Iran</source> <volume>33</volume>, <fpage>142</fpage>. <pub-id pub-id-type="doi">10.47176/mjiri.33.142</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ferrari</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Cook</surname>
<given-names>B. D.</given-names>
</name>
<name>
<surname>Terushkin</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Pintucci</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Mignatti</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Transforming Growth Factor&#x2010;beta 1 (TGF&#x2010;&#x3b2;1) Induces Angiogenesis through Vascular Endothelial Growth Factor (VEGF)&#x2010;mediated Apoptosis</article-title>. <source>J.&#x20;Cell. Physiol.</source> <volume>219</volume>, <fpage>449</fpage>&#x2013;<lpage>458</lpage>. <pub-id pub-id-type="doi">10.1002/jcp.21706</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Garcia-Moreno</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2021</year>). <source>GeneCodis 4: Expanding the Modular Enrichment Analysis to Regulatory Elements</source>. </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gilad</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Serum microRNAs Are Promising Novel Biomarkers</article-title>. <source>PloS one</source> <volume>3</volume>, <fpage>e3148</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0003148</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Gilani</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Esmaeili</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Haghshenas</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2018</year>). <source>The Effect of Eight Weeks Concurrent Training and Supplementation of L_Arginine on Plasma Level of 8-hydroxydeoxyguanosine (8-OHdG), Malondialdehyde and Total Antioxidant Capacity in Elderly Men (Multivariate Longitudinal Modeling)</source>. </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gilani</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Haghshenas</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Esmaeili</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Application of Multivariate Longitudinal Models in SIRT6, FBS, and BMI Analysis of the Elderly</article-title>. <source>The Aging Male</source> <volume>22</volume>, <fpage>260</fpage>&#x2013;<lpage>265</lpage>. <pub-id pub-id-type="doi">10.1080/13685538.2018.1477933</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Gilani</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Kazemnejad</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Zayeri</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Asghari</surname>
<given-names>J.&#x20;M.</given-names>
</name>
<name>
<surname>Izadi</surname>
<given-names>A. F. S.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Predicting Outcomes in Traumatic Brain Injury Using the glasgow Coma Scale: A Joint Modeling of Longitudinal Measurements and Time to Event</article-title>. <source>Iran Red Crescent Med J</source> <volume>19</volume> (<issue>2</issue>), <fpage>e29663</fpage>. </citation>
</ref>
<ref id="B23">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Hansford</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2015</year>). <source>Hereditary Diffuse Gastric Cancer Syndrome: CDH1 Mutations and beyond</source>. <volume>1</volume>, <fpage>23</fpage>&#x2013;<lpage>32</lpage>. </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hartgrink</surname>
<given-names>H. H.</given-names>
</name>
<name>
<surname>Jansen</surname>
<given-names>E. P.</given-names>
</name>
<name>
<surname>van Grieken</surname>
<given-names>N. C.</given-names>
</name>
<name>
<surname>van de Velde</surname>
<given-names>C. J.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Gastric Cancer</article-title>. <source>Lancet (London, England)</source> <volume>374</volume>, <fpage>477</fpage>&#x2013;<lpage>490</lpage>. <pub-id pub-id-type="doi">10.1016/s0140-6736(09)60617-6</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tibshirani</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Friedman</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2009</year>). <source>The Elements of Statistical Learning: Data Mining, Inference, and Prediction</source>. <publisher-loc>Switzerland AG</publisher-loc>: <publisher-name>Springer Science &#x26; Business Media</publisher-name>. </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>He</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Polymorphisms of TGFBR1, TLR4 Are Associated with Prognosis of Gastric Cancer in a Chinese Population</article-title>. <source>Cancer Cel. Int.</source> <volume>18</volume>, <fpage>1</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1186/s12935-018-0682-0</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Howlader</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2014</year>). <source>SEER Cancer Statistics Review, 1975&#x2013;2011</source>, <volume>19</volume>. <publisher-loc>Bethesda, MD</publisher-loc>: <publisher-name>National Cancer Institute</publisher-name>. </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hundahl</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Phillips</surname>
<given-names>J.&#x20;L.</given-names>
</name>
<name>
<surname>Menck</surname>
<given-names>H. R.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>The National Cancer Data Base Report on Poor Survival of US Gastric Carcinoma Patients Treated with Gastrectomy: American Joint Committee on Cancer Staging, Proximal Disease, and the &#x201c;Different Disease&#x201d; Hypothesis</article-title>. <source>Cancer</source> <volume>88</volume>, <fpage>921</fpage>&#x2013;<lpage>932</lpage>. <pub-id pub-id-type="doi">10.1002/(sici)1097-0142(20000215)88:4&#x3c;921:aid-cncr24&#x3e;3.0.co;2-s</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>James</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Witten</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tibshirani</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2013</year>). <source>An Introduction to Statistical Learning</source>, <volume>Vol. 112</volume>. <publisher-name>Springer</publisher-name>. </citation>
</ref>
<ref id="B30">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Jin</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2014</year>). <source>Latent Infection of Human Cytomegalovirus Is Associated with the Development of Gastric Cancer</source>, <volume>8</volume>, <fpage>898</fpage>&#x2013;<lpage>904</lpage>. <pub-id pub-id-type="doi">10.3892/ol.2014.2148</pub-id> </citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>MicroRNA Expression Profiles and Clinicopathological Implications in Lung Adenocarcinoma According to EGFR, KRAS, and ALK Status</article-title>. <source>Oncotarget</source> <volume>8</volume>, <fpage>8484</fpage>. <pub-id pub-id-type="doi">10.18632/oncotarget.14298</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Kursa</surname>
<given-names>M. B.</given-names>
</name>
<name>
<surname>Rudnicki</surname>
<given-names>W. R.</given-names>
</name>
</person-group> (<year>2018</year>). <source>Wrapper Algorithm for All Relevant Feature Selection</source>. <publisher-loc>Boruta</publisher-loc>: <publisher-name>CRAN-Package</publisher-name>. </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Tumor-secreted Exosomal miR-222 Promotes Tumor Progression via Regulating P27 Expression and Re-localization in Pancreatic Cancer</article-title>. <source>Cell Physiol. Biochem.</source> <volume>51</volume>, <fpage>610</fpage>&#x2013;<lpage>629</lpage>. <pub-id pub-id-type="doi">10.1159/000495281</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname>
<given-names>X.-J.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>A Serum microRNA Classifier for Early Detection of Hepatocellular Carcinoma: a Multicentre, Retrospective, Longitudinal Biomarker Identification Study with a Nested Case-Control Study</article-title>. <source>Lancet Oncol.</source> <volume>16</volume>, <fpage>804</fpage>&#x2013;<lpage>815</lpage>. <pub-id pub-id-type="doi">10.1016/s1470-2045(15)00048-0</pub-id> </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Link</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Kupcinskas</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>MicroRNAs as Non-invasive Diagnostic Biomarkers for Gastric Cancer: Current Insights and Future Perspectives</article-title>. <source>World J.&#x20;Gastroenterol.</source> <volume>24</volume>, <fpage>3313</fpage>. <pub-id pub-id-type="doi">10.3748/wjg.v24.i30.3313</pub-id> </citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Gong</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Yao</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Examination of the Expression and Prognostic Significance of DLGAPs in Gastric Cancer Using the TCGA Database and Bioinformatic Analysis</article-title>. <source>Mol. Med. Rep.</source> <volume>18</volume>, <fpage>5621</fpage>&#x2013;<lpage>5629</lpage>. <pub-id pub-id-type="doi">10.3892/mmr.2018.9574</pub-id> </citation>
</ref>
<ref id="B37">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zuo</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2020</year>). <source>A Study on the Expression of SPRED1 and PBRM1 (Baf180) and Their Clinical Significances in Patients with Gastric Cancer</source>, <volume>66</volume>. <publisher-name>Clinical Laboratory</publisher-name>. <pub-id pub-id-type="doi">10.7754/clin.lab.2020.200312</pub-id> </citation>
</ref>
<ref id="B38">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Mau&#xe9;s</surname>
<given-names>J.&#x20;H. d. S.</given-names>
</name>
</person-group> (<year>2018</year>). <source>Gastric Cancer Cell Lines Have Different MYC-Regulated Expression Patterns but Share a Common Core of Altered Genes</source>. </citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moons</surname>
<given-names>K. G.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Transparent Reporting of a Multivariable Prediction Model for Individual Prognosis or Diagnosis (TRIPOD): Explanation and Elaboration</article-title>. <source>Ann. Intern. Med.</source> <volume>162</volume>, <fpage>W1</fpage>&#x2013;<lpage>W73</lpage>. <pub-id pub-id-type="doi">10.7326/m14-0698</pub-id> </citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Penon</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Cito</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Giordano</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Novel Findings about Management of Gastric Cancer: a Summary from 10th IGCC</article-title>. <source>World J.&#x20;Gastroenterol. WJG</source> <volume>20</volume>, <fpage>8986</fpage>. <pub-id pub-id-type="doi">10.3748/wjg.v20.i27.8986</pub-id> </citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shahid</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Rappon</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Berta</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Applications of Artificial Neural Networks in Health Care Organizational Decision-Making: A Scoping Review</article-title>. <source>PloS one</source> <volume>14</volume>, <fpage>e0212356</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0212356</pub-id> </citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z. G. J.&#x20;O. l.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Role of Sp1 Expression in Gastric Cancer: A Meta-Analysis and Bioinformatics Analysis</article-title>. <volume>18</volume>, <fpage>4126</fpage>&#x2013;<lpage>4135</lpage>. <pub-id pub-id-type="doi">10.3892/ol.2019.10775</pub-id> </citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stolzenburg</surname>
<given-names>L. R.</given-names>
</name>
<name>
<surname>Wachtel</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Dang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Harris</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>miR-1343 Attenuates Pathways of Fibrosis by Targeting the TGF-&#x3b2; Receptors</article-title>. <source>Biochem. J.</source> <volume>473</volume>, <fpage>245</fpage>&#x2013;<lpage>256</lpage>. <pub-id pub-id-type="doi">10.1042/bj20150821</pub-id> </citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Su</surname>
<given-names>Z.-X.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Diagnostic and Prognostic Value of Circulating miR-18a in the Plasma of Patients with Gastric Cancer</article-title>. <source>Tumor Biol.</source> <volume>35</volume>, <fpage>12119</fpage>&#x2013;<lpage>12125</lpage>. <pub-id pub-id-type="doi">10.1007/s13277-014-2516-6</pub-id> </citation>
</ref>
<ref id="B45">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Tamma</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2018</year>). <source>VEGFA and VEGFR2 RNAscope Determination in Gastric Cancer</source>, <volume>49</volume>, <fpage>429</fpage>&#x2013;<lpage>435</lpage>. <pub-id pub-id-type="doi">10.1007/s10735-018-9777-0</pub-id> </citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tan</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Yeoh</surname>
<given-names>K.-G. J.&#x20;G.</given-names>
</name>
</person-group> (<year>2015</year>). <source>Genet. Mol. pathogenesis gastric adenocarcinoma</source> <volume>149</volume>, <fpage>1153</fpage>&#x2013;<lpage>1162</lpage>. <pub-id pub-id-type="doi">10.1053/j.gastro.2015.05.059</pub-id> </citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tapia</surname>
<given-names>O.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>The PI3K/AKT/mTOR Pathway Is Activated in Gastric Cancer with Potential Prognostic and Predictive Significance</article-title>. <volume>465</volume>, <fpage>25</fpage>&#x2013;<lpage>33</lpage>. <pub-id pub-id-type="doi">10.1007/s00428-014-1588-4</pub-id> </citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Usuba</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Circulating miRNA Panels for Specific and Early Detection in Bladder Cancer</article-title>. <source>Cancer Sci.</source> <volume>110</volume>, <fpage>408</fpage>. <pub-id pub-id-type="doi">10.1111/cas.13856</pub-id> </citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Usuba</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Circulating miRNA Panels for Specific and Early Detection in Bladder Cancer</article-title>. <volume>110</volume>, <fpage>408</fpage>&#x2013;<lpage>419</lpage>. <pub-id pub-id-type="doi">10.1111/cas.13856</pub-id> </citation>
</ref>
<ref id="B50">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Vauhkonen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Vauhkonen</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Sipponen</surname>
<given-names>P. J.&#x20;B. P.</given-names>
</name>
<name>
<surname>Gastroenterology</surname>
<given-names>R. C.</given-names>
</name>
</person-group> (<year>2006</year>). <source>Pathology and Molecular Biology of Gastric Cancer</source>, <volume>20</volume>, <fpage>651</fpage>&#x2013;<lpage>674</lpage>. <pub-id pub-id-type="doi">10.1016/j.bpg.2006.03.016</pub-id> </citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Veitch</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Uedo</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Yao</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>East</surname>
<given-names>J.&#x20;E.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Optimizing Early Upper Gastrointestinal Cancer Detection at Endoscopy</article-title>. <source>Nat. Rev. Gastroenterol. Hepatol.</source> <volume>12</volume>, <fpage>660</fpage>. <pub-id pub-id-type="doi">10.1038/nrgastro.2015.128</pub-id> </citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wei</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>The Diagnostic Value of Circulating microRNAs as a Biomarker for Gastric Cancer: A Meta-Analysis</article-title>. <source>Oncol. Rep.</source> <volume>41</volume>, <fpage>87</fpage>&#x2013;<lpage>102</lpage>. <pub-id pub-id-type="doi">10.3892/or.2018.6782</pub-id> </citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wiemken</surname>
<given-names>T. L.</given-names>
</name>
<name>
<surname>Kelley</surname>
<given-names>R. R.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Machine Learning in Epidemiology and Health Outcomes Research</article-title>. <source>Annu. Rev. Public Health</source> <volume>41</volume>, <fpage>21</fpage>&#x2013;<lpage>36</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-publhealth-040119-094437</pub-id> </citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Worthley</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Gastric Adenocarcinoma and Proximal Polyposis of the Stomach (GAPPS): a New Autosomal Dominant Syndrome</article-title>. <volume>61</volume>, <fpage>774</fpage>&#x2013;<lpage>779</lpage>. <pub-id pub-id-type="doi">10.1136/gutjnl-2011-300348</pub-id> </citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yan</surname>
<given-names>L.-H.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Overexpression of E2F1 in Human Gastric Carcinoma Is Involved in Anti-cancer Drug Resistance</article-title>. <volume>14</volume>, <fpage>1</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1186/1471-2407-14-904</pub-id> </citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yao</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Identification of Serum Circulating MicroRNAs as Novel Diagnostic Biomarkers of Gastric Cancer</article-title>. <source>Front. Genet.</source> <volume>11</volume>, <fpage>515</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2020.591515</pub-id> </citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yokoi</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Integrated Extracellular microRNA Profiling for Ovarian Cancer Screening</article-title>. <source>Nat. Commun.</source> <volume>9</volume>, <fpage>1</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1038/s41467-018-06434-4</pub-id> </citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yoshimura</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Exosomal miR-99a-5p Is Elevated in Sera of Ovarian Cancer Patients and Promotes Cancer Cell Invasion by Increasing Fibronectin and Vitronectin Expression in Neighboring Peritoneal Mesothelial Cells</article-title>. <source>BMC cancer</source> <volume>18</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1186/s12885-018-4974-5</pub-id> </citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yuan</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Plasma Extracellular RNA Profiles in Healthy and Cancer Patients</article-title>. <source>Scientific Rep.</source> <volume>6</volume>, <fpage>1</fpage>&#x2013;<lpage>11</lpage>. <pub-id pub-id-type="doi">10.1038/srep19413</pub-id> </citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zeng</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Cancer-derived Exosomal miR-25-3p Promotes Pre-metastatic Niche Formation by Inducing Vascular Permeability and Angiogenesis</article-title>. <source>Nat. Commun.</source> <volume>9</volume>, <fpage>1</fpage>&#x2013;<lpage>14</lpage>. <pub-id pub-id-type="doi">10.1038/s41467-018-07810-w</pub-id> </citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>YARS as an Oncogenic Protein that Promotes Gastric Cancer Progression through Activating PI3K-Akt Signaling</article-title>. <volume>146</volume>, <fpage>329</fpage>&#x2013;<lpage>342</lpage>. <pub-id pub-id-type="doi">10.1007/s00432-019-03115-7</pub-id> </citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Circular RNA CircCACTIN Promotes Gastric Cancer Progression by Sponging MiR-331-3p and Regulating TGFBR1 Expression</article-title>. <source>Int. J.&#x20;Biol. Sci.</source> <volume>15</volume>, <fpage>1091</fpage>. <pub-id pub-id-type="doi">10.7150/ijbs.31533</pub-id> </citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Human Cytomegalovirus Detection in Gastric Cancer and its Possible Association with Lymphatic Metastasis</article-title>. <volume>88</volume>, <fpage>62</fpage>&#x2013;<lpage>68</lpage>. <pub-id pub-id-type="doi">10.1016/j.diagmicrobio.2017.02.001</pub-id> </citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Detection of Circulating Tumor Cells in Peripheral Blood from Patients with Gastric Cancer Using microRNA as a Marker</article-title>. <source>J.&#x20;Mol. Med.</source> <volume>88</volume>, <fpage>709</fpage>&#x2013;<lpage>717</lpage>. <pub-id pub-id-type="doi">10.1007/s00109-010-0617-2</pub-id> </citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>TEAD1/4 Exerts Oncogenic Role and Is Negatively Regulated by miR-4269 in Gastric Tumorigenesis</article-title>. <source>Oncogene</source> <volume>36</volume>, <fpage>6518</fpage>&#x2013;<lpage>6530</lpage>. <pub-id pub-id-type="doi">10.1038/onc.2017.257</pub-id> </citation>
</ref>
<ref id="B66">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>Z.-H.</given-names>
</name>
</person-group> (<year>2012</year>). <source>Ensemble Methods: Foundations and Algorithms</source>. <publisher-name>CRC Press</publisher-name>. </citation>
</ref>
</ref-list>
</back>
</article>