<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Earth Sci.</journal-id>
<journal-title>Frontiers in Earth Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Earth Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-6463</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1491334</article-id>
<article-id pub-id-type="doi">10.3389/feart.2025.1491334</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Earth Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Logging-data-driven lithology identification in complex reservoirs: an example from the Niuxintuo block of the Liaohe oilfield</article-title>
<alt-title alt-title-type="left-running-head">Fan et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/feart.2025.1491334">10.3389/feart.2025.1491334</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Fan</surname>
<given-names>Zuochun</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Hu</surname>
<given-names>Changhao</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Jiang</surname>
<given-names>Shu</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Man</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Cai</surname>
<given-names>Ye</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Jiang</surname>
<given-names>Yue</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Li</surname>
<given-names>Yang</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2527385/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tian</surname>
<given-names>Mei</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Institute of Advanced Studies</institution>, <institution>China University of Geosciences</institution>, <addr-line>Wuhan</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Petrochina Liaohe Oilfield Company</institution>, <addr-line>Panjin</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>School of Sustainable Energy</institution>, <institution>China University of Geosciences</institution>, <addr-line>Wuhan</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1237463/overview">Hu Li</ext-link>, Sichuan University of Science and Engineering, China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1519556/overview">Jianguo Zhang</ext-link>, China University of Geosciences, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2839096/overview">Zikun Zhou</ext-link>, Panzhihua University, China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Yang Li, <email>7891235@qq.com</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>11</day>
<month>03</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>13</volume>
<elocation-id>1491334</elocation-id>
<history>
<date date-type="received">
<day>04</day>
<month>09</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>12</day>
<month>02</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Fan, Hu, Jiang, Li, Cai, Jiang, Li and Tian.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Fan, Hu, Jiang, Li, Cai, Jiang, Li and Tian</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>For lithologic oil reservoirs, lithology identification plays a significant guiding role in exploration targeting, reservoir evaluation, well network adjustment and optimization, and the establishment of reservoir models. Lithology is usually predicted from well log data based on limited core observations. In recent years, machine learning algorithms have been applied to lithology identification to enhance prediction accuracy. In this paper, five algorithms, including Bayes discriminant analysis, Random Forest (RF), Support Vector Machine (SVM), Back Propagation Neural Network (BPNN), and Convolutional Neural Network (CNN) are evaluated for lithology identification using data from the Niuxintuo reservoir. This reservoir is characterized by complex structural and sedimentary features, strong heterogeneity, and intricate lithological properties, all of which present considerable challenges for well logging identification. First, we conducted a detailed observation of the core lithology. Based on the requirements for reservoir evaluation and the principles of logging identification, we reclassify the lithology of the study area into two categories: clastic rocks and dolomite. The clastic rocks are further subdivided into five rock types: fine sandstone, medium-coarse sandstone, conglomerate, mudstone, and transitional rock. The well log series were selected through sensitivity analysis. Then, Bayes discriminant analysis and four machine learning methods were trained to identify the lithology of the study area. The results indicate that except for Bayes discriminant analysis, all the constructed machine learning classifiers demonstrate high prediction accuracy, with the accuracy rate exceeding 85%. Among them, SVM classifier shows the best performance achieving a prediction accuracy as high as 93%. Additionally, the well-trained SVM model was successfully used to predict the lithology profile of blind wells. 
Our findings provide valuable guidance for predicting the remaining oil distribution and further exploration potential in the Niuxintuo oilfield. Furthermore, this study gains insight into the process and methodology of rapidly predicting lithology of hydrocarbon reservoirs using easily accessible well logging data.</p>
</abstract>
<kwd-group>
<kwd>lithology classification</kwd>
<kwd>machine learning</kwd>
<kwd>support vector machine</kwd>
<kwd>random forest</kwd>
<kwd>convolutional neural networks</kwd>
<kwd>back propagation neural network</kwd>
<kwd>Bayes discriminant analysis</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Economic Geology</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Lithology identification is a crucial issue in reservoir characterization, as it helps correlate critical reservoir properties such as porosity, permeability and oil saturation, and plays a vital role in constructing field-scale reservoir models. Well log data have advantages such as high vertical resolution, good continuity, and convenient data acquisition. Therefore, they are an important resource for obtaining underground lithological information. Lithology classification based on well log data forms the foundation for reservoir characterization and provides a basis for geological studies such as sedimentary facies and environmental analysis. In addition to its significance in formation evaluation and geological analysis, lithology interpretation plays an important role in predicting sweet spot reservoirs and forecasting remaining oil distribution. The traditional methods for interpreting lithology mainly include cross-plot technique (e.g., <xref ref-type="bibr" rid="B33">Sanyal et al., 1980</xref>), curve feature method (<xref ref-type="bibr" rid="B2">Anifowose et al., 2019</xref>), imaging logging chart method (<xref ref-type="bibr" rid="B9">Cohn et al., 1996</xref>), multiple linear regression method (<xref ref-type="bibr" rid="B11">Delfiner et al., 1987</xref>), and discriminant analysis method (<xref ref-type="bibr" rid="B12">Dong et al., 2016</xref>; <xref ref-type="bibr" rid="B13">Dong et al., 2022</xref>). However, each of these methods has some limitations (<xref ref-type="bibr" rid="B36">Sun et al., 2019</xref>). For example, a lack of clarity in the relationships between the data points may cause the cross-plot technique to fail. Moreover, it cannot display higher-dimensional spatial information, and usually only two parameters can be considered at the same time (<xref ref-type="bibr" rid="B28">McDowell et al., 1998</xref>). 
Multiple linear regression method is very sensitive to highly correlated independent variables, and the relationship between variables is often nonlinear, which may lead to a decrease in the explanatory power of the model (<xref ref-type="bibr" rid="B11">Delfiner et al., 1987</xref>). Discriminant analysis methods require a large number of high-quality datasets, and are limited by some assumed premises (<xref ref-type="bibr" rid="B12">Dong et al., 2016</xref>). Overall, these methods generally require a large number of samples, which are very time-consuming. Recognizing lithology boundaries from well log data is inherently a nonlinear problem, primarily because log curves are influenced by rock properties like pore fluids. Therefore, it is essential to develop a suitable nonlinear approach that can effectively address these challenges.</p>
<p>The rapid advancement of computer technology has enabled machine learning methods to offer more time- and cost-effective solutions with higher lithology identification accuracy, compared to traditional lithology identification methods (e.g., <xref ref-type="bibr" rid="B3">Ashraf et al., 2021</xref>; <xref ref-type="bibr" rid="B7">Bressan et al., 2020</xref>). Nowadays, numerous machine learning methods have emerged and been successfully applied to lithology identification (e.g., <xref ref-type="bibr" rid="B40">Wang et al., 2014</xref>; <xref ref-type="bibr" rid="B4">Bhattacharya et al., 2016</xref>; <xref ref-type="bibr" rid="B5">Biau and Scornet, 2016</xref>; <xref ref-type="bibr" rid="B34">Saporetti et al., 2018</xref>; <xref ref-type="bibr" rid="B42">Wang et al., 2020</xref>; <xref ref-type="bibr" rid="B47">Zhang et al., 2023</xref>). Machine learning can be categorized into three types: unsupervised learning, semi-supervised learning, and supervised learning. Unsupervised learning techniques, such as expectation maximisation (<xref ref-type="bibr" rid="B30">Miyahara et al., 2020</xref>), K-means clustering (<xref ref-type="bibr" rid="B18">Huang et al., 2016</xref>), hierarchical clustering (<xref ref-type="bibr" rid="B38">Vichi et al., 2022</xref>), and deep autoencoders (<xref ref-type="bibr" rid="B21">Kampffmeyer et al., 2018</xref>), work only by grouping the lithology according to its intrinsic characteristics to provide an overall perspective. They are helpful when the dataset is limited (i.e., when no labels are available). 
In contrast, semi-supervised learning (SSL) techniques, such as positive and unlabeled machine learning (<xref ref-type="bibr" rid="B17">Helm et al., 2023</xref>), active semi-supervised algorithms (<xref ref-type="bibr" rid="B43">Xu et al., 2021a</xref>; <xref ref-type="bibr" rid="B35">Shan et al., 2021</xref>), and Laplacian Support Vector Machines (<xref ref-type="bibr" rid="B46">Yang and Xu, 2018</xref>), are beneficial when there is a limited amount of labelled data accessible. By contrast, supervised learning techniques, which are suitable for learning a pattern from a known labelled dataset and inferring new instances in accordance with this pattern, can provide precise training data and therefore give very accurate results (<xref ref-type="bibr" rid="B20">Jordan and Mitchell, 2015</xref>). Several well-known supervised shallow learning algorithms are used for petrographic classification of core-tagging-based logs. This category includes backpropagation neural networks (<xref ref-type="bibr" rid="B1">Amari, 1993</xref>; <xref ref-type="bibr" rid="B14">Dong et al., 2023</xref>), support vector machine (SVM) (<xref ref-type="bibr" rid="B40">Wang et al., 2014</xref>), K-nearest neighbours (<xref ref-type="bibr" rid="B39">Wang et al., 2023</xref>; <xref ref-type="bibr" rid="B24">Li et al., 2024</xref>), and decision trees (DT) (<xref ref-type="bibr" rid="B50">Zhou et al., 2020</xref>). In addition, homogeneous ensemble techniques such as Random Forest (RF) (<xref ref-type="bibr" rid="B45">Yan et al., 2024</xref>), Extreme Gradient Boosting (<xref ref-type="bibr" rid="B8">Chen and Guestrin, 2016</xref>; <xref ref-type="bibr" rid="B48">Zheng et al., 2022</xref>), and Logistic Boosting Regression (<xref ref-type="bibr" rid="B19">Huang et al., 2019</xref>) belong to the same category, and such supervised algorithms use geological rules to make petrographic estimation more credible. 
In addition, several popular deep learning (DL) algorithms (<xref ref-type="bibr" rid="B16">Goodfellow et al., 2016</xref>; <xref ref-type="bibr" rid="B29">Miclea et al., 2020</xref>), such as convolutional neural networks (<xref ref-type="bibr" rid="B44">Xu et al., 2021b</xref>), recurrent neural networks (<xref ref-type="bibr" rid="B37">Tian et al., 2021</xref>), long short-term memory networks (<xref ref-type="bibr" rid="B26">Lin et al., 2020</xref>), and TabNet (<xref ref-type="bibr" rid="B27">Madani et al., 2018</xref>; <xref ref-type="bibr" rid="B25">Li et al., 2022</xref>), possess excellent properties such as weight sharing, local connectivity, and translation invariance that allow them to effectively handle high-dimensional data.</p>
<p>The Niuxintuo reservoir is a typical lithological reservoir. Previous studies have shown that sedimentary environments significantly influence the lithology distribution. Moreover, the lithology controls petrophysical properties, and petrophysical properties control oil saturation (<xref ref-type="bibr" rid="B51">Zhou, 2022</xref>; <xref ref-type="bibr" rid="B23">Li, 2022</xref>). In this article, we apply multiple methods for lithology identification in the study area and select the most appropriate method for lithology prediction. Firstly, based on the detailed observation and description of rock cores, the lithology of the Niuxintuo area is divided into six categories: fine sandstone, medium-coarse sandstone, conglomerate, mudstone, transitional rock, and dolomite. Subsequently, the logging sequence is standardized and normalized to eliminate systematic errors, thereby improving the accuracy in describing, interpreting, and predicting reservoirs. Building on this, extensive cross plots are employed to evaluate the sensitivity of logging sequences. By integrating lithology sensitivity, data reliability, and curve complementarity, six key parameters&#x2014;acoustic transit time (AC), compensated neutron (CNL), density (DEN), gamma ray (GR), resistivity (RT), and conductivity (CON_CAL)&#x2014;are selected as predictive curves for lithology identification. The initial step in multi-method lithology identification involves classifying lithology using Bayes discriminant analysis. However, with a prediction accuracy of only 58.20%, this approach falls short of meeting the requirements for reliable lithology prediction. Then, the focus shifts to exploring lithology identification using advanced machine learning algorithms, including RF, SVM, BPNN, and CNN. The developed machine learning classifiers demonstrate high prediction accuracy, with SVM achieving the best performance, boasting a prediction accuracy of up to 93%. 
The findings offer crucial guidance for forecasting remaining oil distribution and evaluating further exploration potential in the Niuxintuo oilfield. Moreover, this study provides valuable insights into the methodology and process of rapidly predicting hydrocarbon reservoir lithology using a large amount of logging data.</p>
</sec>
<sec sec-type="methods" id="s2">
<title>2 Methodology</title>
<p>This section provides a detailed overview of lithology identification methods, including core lithology observation and statistics, well logging data preprocessing, Bayes discriminant analysis, and four machine learning methods for lithology identification. The overall workflow is shown in <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Lithology identification flowchart of this study. <bold>(A)</bold> Data preparation. <bold>(B)</bold> Construction of multiple lithology recognition classifiers. <bold>(C)</bold> Discussion on Classification Results and Blind Well test.</p>
</caption>
<graphic xlink:href="feart-13-1491334-g001.tif"/>
</fig>
<sec id="s2-1">
<title>2.1 Core lithology observation and statistics</title>
<p>The lithology types of Niuxintuo Oilfield are complex. Based on the detailed observation of core samples along with thin section data, the lithology types in the study area are summarized. Overall, the lithology of Niuxintuo reservoir can be divided into two categories: one is the alluvial fan type clastic rock composed of fine sandstone, siltstone, medium sandstone, coarse sandstone, and gravel rock; the other is laminated dolomite and muddy dolomite with transitional fan edge lake facies (<xref ref-type="fig" rid="F2">Figures 2</xref>, <xref ref-type="fig" rid="F3">3</xref>).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Typical core photographs for different lithologies of Niuxintuo reservoir. <bold>(A)</bold> Tuo 22, 1693.72 m, fine sandstone; <bold>(B)</bold> Tuo 32&#x2013;34, 1713.56 m, medium sandstone; <bold>(C)</bold> Tuoguan 2, 1790.08 m, coarse sandstone; <bold>(D)</bold> Tuo 22, 1707.66 m, gravel rock; <bold>(E)</bold> Tuo 31&#x2013;39, 1860.71 m, argillaceous limestone; <bold>(F)</bold> Tuo 25&#x2013;33, 2,328.86 m, silty mudstone; <bold>(G)</bold> Tuo 32&#x2013;34, 1745.69 m, argillaceous dolomite; <bold>(H)</bold> Tuo 12, 2,103.66 m, dolomite; <bold>(I)</bold> Tuo 32&#x2013;34, 1748.77 m, dolomitic mudstone.</p>
</caption>
<graphic xlink:href="feart-13-1491334-g002.tif"/>
</fig>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Casting thin section of different lithologies. <bold>(A)</bold> Tuo 31&#x2013;39, 1,690.28 m, fine sandstone; <bold>(B)</bold> Tuo 25&#x2013;33, 2,396.43 m, gravelly fine sandstone; <bold>(C)</bold> Tuo 31&#x2013;39, 1785.74 m, medium sandstone; <bold>(D)</bold> Tuo 14, 1,557.87 m, coarse sandstone; <bold>(E)</bold> Tuo 25&#x2013;33, 2,324.63 m, conglomerate; <bold>(F)</bold> Tuo 25&#x2013;33, 2,321.46 m, silty mudstone; <bold>(G)</bold> Tuo 31&#x2013;39, 1719.58 m, fine sand mixed with mudstone; <bold>(H)</bold> Tuo 12, 1,663.19 m, dolomite; <bold>(I)</bold> Tuo 32&#x2013;34, 1745.6 m, muddy dolomite.</p>
</caption>
<graphic xlink:href="feart-13-1491334-g003.tif"/>
</fig>
<p>Furthermore, through the observation of cast thin sections and analysis of mineral composition, genetic processes, compositional content, and sedimentary structures, the lithology has been further subdivided into 19 fundamental rock types (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Lithology types of the Niuxintuo oil reservoir.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th colspan="2" align="center">Basic rock types from cores</th>
<th align="center">Classification of logging lithology</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="5" align="center">Clastic rock</td>
<td align="center">Unequal-grained sandstone, conglomerate</td>
<td align="center">Conglomerate</td>
</tr>
<tr>
<td align="center">Coarse sandstone, pebbly coarse sandstone</td>
<td rowspan="2" align="center">Medium-coarse sandstone</td>
</tr>
<tr>
<td align="center">Medium sandstone, pebbly medium sandstone</td>
</tr>
<tr>
<td align="center">Fine sandstone, pebbly fine sandstone, and dolomitic fine sandstone</td>
<td align="center">Fine sandstone</td>
</tr>
<tr>
<td align="center">Mudstone</td>
<td align="center">Mudstone</td>
</tr>
<tr>
<td rowspan="2" align="center">Transitional rocks</td>
<td align="center">Mudstone with gravel, silty mudstone, and dolomitic mudstone</td>
<td rowspan="2" align="center">Transitional rocks</td>
</tr>
<tr>
<td align="center">Siltstone, pebbly siltstone, argillaceous siltstone</td>
</tr>
<tr>
<td rowspan="2" align="center">Carbonate</td>
<td align="center">Dolomite</td>
<td rowspan="2" align="center">Dolomite</td>
</tr>
<tr>
<td align="center">Argillaceous dolomite</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Cross plot is the most commonly used method for displaying the relationships between variables and is widely used in reservoir research (<xref ref-type="bibr" rid="B15">Ehsan and Gu, 2020</xref>). It can display different logging data on the same plane and evaluate the relationships between these data through the position and shape of the intersection points. Accurate lithology identification and characterization require first understanding the physical property differences among various rock types, followed by selecting suitable logging parameters for quantitative differentiation.</p>
<p>Using the preprocessed logging sequences and core lithology labels, a cross-plot analysis was conducted to identify lithology-sensitive logging curves (<xref ref-type="fig" rid="F4">Figure 4</xref>). Considering lithology sensitivity, data quality reliability, and curve complementarity, AC, CNL, DEN, GR, RT, and CON_CAL were selected as lithology-sensitive curves for subsequent research on logging-based lithology identification.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Well logging cross plots of different lithologies. <bold>(A)</bold> AC-CNL cross plot; <bold>(B)</bold> AC-DEN cross plot; <bold>(C)</bold> DEN-CON_CAL cross plot; <bold>(D)</bold> DEN-CNL cross plot; <bold>(E)</bold> GR-RT cross plot; <bold>(F)</bold> AC-GR cross plot.</p>
</caption>
<graphic xlink:href="feart-13-1491334-g004.tif"/>
</fig>
<p>
<xref ref-type="fig" rid="F4">Figures 4A, B</xref> illustrate that the AC-CNL and AC-DEN cross-plots exhibit strong lithological differentiation, whereas the DEN-CON_CAL and GR-RT cross-plots yield moderate results (<xref ref-type="fig" rid="F4">Figures 4C, E</xref>). In contrast, the DEN-CNL and AC-GR cross-plots demonstrate the least effectiveness (<xref ref-type="fig" rid="F4">Figures 4D, F</xref>). <xref ref-type="fig" rid="F5">Figure 5</xref> indicates that dolomite has a higher GR value and slightly larger neutron response, making it easy to distinguish. The characteristics of mudstone are high GR value, low RT value, high AC value, and low density, with high discrimination. The GR value of fine siltstone shows a medium to low value, with a slightly higher neutron response. The GR value of sandy conglomerate shows a medium to low value, while the CNL value is small.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Logging response characteristics of different lithologies.</p>
</caption>
<graphic xlink:href="feart-13-1491334-g005.tif"/>
</fig>
</sec>
<sec id="s2-2">
<title>2.2 Standardization of logging data</title>
<p>Logging sequence data preprocessing provides near-wellbore stratigraphic information, which can be used to identify changes in stratigraphic interfaces, lithology, and sedimentary environments. However, in practical work, due to measurement errors, noise and outliers, depth migration or missing data, directly using raw logging data for lithology inversion may lead to data mismatch, lack of spatial constraints, low signal-to-noise ratio, and parameter mismatch, which will inevitably affect the accuracy of inversion results (<xref ref-type="bibr" rid="B48">Zheng et al., 2022</xref>). Therefore, preprocessing logging curves can improve data quality and availability, eliminate the influence of non-geological factors, and truly reflect stratigraphic characteristics.</p>
<p>The Niuxintuo Oilfield in Liaohe has a long history of development. Over the course of extensive exploration and production activities, systematic errors have emerged in the logging data due to ongoing updates and changes in logging instruments. If the original logging sequence data is directly used for reservoir description, it will affect the accuracy and reliability of the results. Therefore, standardizing logging data can help eliminate systematic errors and enhance the ability to describe, interpret, and predict reservoirs (<xref ref-type="bibr" rid="B48">Zheng et al., 2022</xref>).</p>
<p>The key to standardizing logging data is the selection of standard layers, usually selecting mudstones or coal seams with a certain thickness that are stably developed throughout the area. There is a total of seven sets of oil bearing formations in the Niuxintuo oil reservoir. Using GES (Geological Evaluation System) software, the AC, CNL, DEN, GR, RT, and CON_CAL logging curves were standardized in batches.</p>
</sec>
<sec id="s2-3">
<title>2.3 Bayes discriminant analysis</title>
<p>Discriminant analysis is a statistical learning method used to establish one or more discriminant functions and assign sample points to different categories (<xref ref-type="bibr" rid="B10">Cui et al., 2023</xref>). The goal is to identify features or variables that can distinguish different categories to the greatest extent by analyzing training samples of known categories, and use these features or variables to construct discriminant functions to classify unknown samples.</p>
</sec>
<sec id="s2-4">
<title>2.4 Random forest</title>
<p>RF uses Bagging to construct multiple training datasets through bootstrap sampling, and then constructs a base classifier for each sample set, which can improve the overall performance and robustness of the model (<xref ref-type="bibr" rid="B6">Breiman, 2001</xref>). The contribution of each feature to the model&#x2019;s predictive performance is evaluated during classification by calculating the information gain rate of the variables. This approach quantifies the importance of each feature parameter, allowing for the selection of variables with higher information gain rates. By focusing on these key variables, the modeling process becomes more streamlined, the influence of redundant features is minimized, and both the model&#x2019;s performance and its generalization capability are enhanced.</p>
</sec>
<sec id="s2-5">
<title>2.5 Support vector machine</title>
<p>SVM is a binary classification model. The basic principle is to construct a hyperplane with maximum margin in a specific space to achieve correct partitioning of samples of different categories (<xref ref-type="bibr" rid="B40">Wang et al., 2014</xref>). For a given training dataset, multiple hyperplanes may satisfy the separation conditions. However, the objective of SVM is to identify the unique hyperplane that maximizes the margin, ensuring the greatest possible separation between classes. Lithology recognition is a multi-class classification problem. For multi-class classification problems, SVM can adopt one-vs-rest (One vs. Rest) or one-vs-one (One vs. One) classification strategies (<xref ref-type="bibr" rid="B40">Wang et al., 2014</xref>). In the one-vs-rest method, each category is separated from all the other categories combined, so that multiple binary classification models are constructed for classification. In the one-vs-one method, a binary classification model is constructed for each pair of categories, and the final result is determined as the category with the highest number of votes through voting or other strategies. Whether it is a binary classification problem or a multi-class classification problem, SVM can solve it and exhibits good performance in handling high-dimensional data and nonlinear problems.</p>
</sec>
<sec id="s2-6">
<title>2.6 Back propagation neural network</title>
<p>BPNN is a multi-layer feedforward neural network trained according to the error backpropagation algorithm (<xref ref-type="bibr" rid="B32">Rumelhart et al., 1986</xref>). The learning rule involves using the steepest descent method to iteratively adjust the network&#x2019;s weights and thresholds through backpropagation, aiming to minimize the network&#x2019;s total squared error (<xref ref-type="bibr" rid="B14">Dong et al., 2023</xref>; <xref ref-type="bibr" rid="B41">Wang and Wang, 2021</xref>). The neural network consists of three parts: input layer, hidden layer, and output layer. The main process of BP neural networks is divided into two stages, namely, signal forward propagation and error back propagation. Signal forward propagation refers to the process of transmitting information from the input layer through the hidden layer to the output layer. In contrast, error backpropagation involves transmitting the error from the output layer to the input layer, sequentially adjusting the weights and biases of the hidden-to-output and input-to-hidden layers (<xref ref-type="bibr" rid="B14">Dong et al., 2023</xref>; <xref ref-type="bibr" rid="B31">Peng et al., 2024</xref>). The main factors affecting the performance of BP neural networks include the number of hidden layer nodes, the selection of activation functions, and the parameter setting of learning rates.</p>
<p>Based on the preprocessing of logging data, we analyze the factors influencing lithology and select the preferred logging response parameters&#x2014;AC, CNL, DEN, GR, RT, and CON_CAL&#x2014;as input features for the model. This means the input layer consists of six neurons. The initial number of neurons in the hidden layer is set to 1&#x2013;2 times the number of input neurons. The optimal number of hidden layer neurons is then determined automatically during the learning process through network structure optimization. The output layer corresponds to the six types of lithology, that is, the number of output layer nodes is six. The basic architecture of a BPNN model is shown in <xref ref-type="fig" rid="F6">Figure 6</xref>.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Basic architecture of a BP neural network.</p>
</caption>
<graphic xlink:href="feart-13-1491334-g006.tif"/>
</fig>
</sec>
<sec id="s2-7">
<title>2.7 Convolutional neural networks</title>
<p>CNNs are an important type of artificial neural network, but they are distinct from traditional neural networks such as multi-layer perceptron neural networks, RBF neural networks, and fuzzy logic neural networks (<xref ref-type="bibr" rid="B49">Zhong et al., 2019</xref>). A CNN consists of five layers: data input layer, convolutional computing layer, ReLU excitation layer, pooling layer, and fully connected layer. CNN combines three ideas to achieve pattern recognition: local receptive fields, weight sharing, and undersampling. The local receptive field refers to the small neighborhood of units in the previous layer to which each neuron of a layer is connected. Each neuron extracts fundamental visual features, such as line segments, endpoints, and angles, from this small neighborhood of the input data. Weight sharing refers to CNN sharing the weights of some neurons; therefore, fewer parameters are optimized during the training process. Undersampling reduces the feature resolution, which provides invariance to displacement, scaling, and other forms of distortion (<xref ref-type="bibr" rid="B22">Le and Borji, 2017</xref>; <xref ref-type="bibr" rid="B49">Zhong et al., 2019</xref>).</p>
</sec>
</sec>
<sec sec-type="results|discussion" id="s3">
<title>3 Results and discussion</title>
<sec id="s3-1">
<title>3.1 Lithological classification based on Bayes discriminant analysis</title>
<p>Binary classification problems are typically addressed using the Fisher criterion, while the Bayes criterion is commonly employed for multi-class classification problems. To tackle the lithology identification of clastic rocks using well logging data, this study develops discriminant functions based on the Bayes criterion. The logging curve values of each lithology sample are substituted into the following six Bayes discriminant functions to calculate the corresponding function values. The six function values are then compared, and the sample is assigned to the category whose function yields the highest value. The coefficients of the Bayes discriminant functions are shown below (<xref ref-type="table" rid="T2">Table 2</xref>).</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Bayesian discriminant analysis equation coefficients for different lithologies.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Logging curve</th>
<th align="center">Fine sandstone</th>
<th align="center">Medium coarse sandstone</th>
<th align="center">Conglomerate</th>
<th align="center">Mudstone</th>
<th align="center">Transitional rocks</th>
<th align="center">Dolomite</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">AC</td>
<td align="center">1.048</td>
<td align="center">1.050</td>
<td align="center">1.065</td>
<td align="center">1.126</td>
<td align="center">1.078</td>
<td align="center">1.065</td>
</tr>
<tr>
<td align="center">CNL</td>
<td align="center">2.038</td>
<td align="center">2.129</td>
<td align="center">2.055</td>
<td align="center">2.224</td>
<td align="center">2.051</td>
<td align="center">2.027</td>
</tr>
<tr>
<td align="center">DEN</td>
<td align="center">304.246</td>
<td align="center">308.284</td>
<td align="center">311.549</td>
<td align="center">304.854</td>
<td align="center">310.230</td>
<td align="center">307.489</td>
</tr>
<tr>
<td align="center">GR</td>
<td align="center">0.154</td>
<td align="center">0.179</td>
<td align="center">0.141</td>
<td align="center">0.198</td>
<td align="center">0.174</td>
<td align="center">0.206</td>
</tr>
<tr>
<td align="center">RT</td>
<td align="center">0.126</td>
<td align="center">0.138</td>
<td align="center">0.127</td>
<td align="center">0.128</td>
<td align="center">0.121</td>
<td align="center">0.123</td>
</tr>
<tr>
<td align="center">CON_CAL</td>
<td align="center">0.053</td>
<td align="center">0.056</td>
<td align="center">0.053</td>
<td align="center">0.057</td>
<td align="center">0.052</td>
<td align="center">0.051</td>
</tr>
<tr>
<td align="center">(constant)</td>
<td align="center">&#x2212;560.977</td>
<td align="center">&#x2212;576.291</td>
<td align="center">&#x2212;584.414</td>
<td align="center">&#x2212;596.900</td>
<td align="center">&#x2212;586.249</td>
<td align="center">&#x2212;576.476</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>According to the Bayes discriminant coefficient table, the Bayes discriminant function can be listed as follows (<xref ref-type="disp-formula" rid="e1">Equations 1</xref>&#x2013;<xref ref-type="disp-formula" rid="e6">6</xref>):<disp-formula id="e1">
<mml:math id="m1">
<mml:mrow>
<mml:mtable columnalign="left">
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:mtext>Fine&#x2009;sandstone</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>560.977</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1.048</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>AC</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>2.038</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>CNL</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>304.246</mml:mn>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mspace width="8em"/>
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>DEN</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.154</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>GR</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.126</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>RT</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.053</mml:mn>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mspace width="8em"/>
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>CON</mml:mtext>
<mml:mo>_</mml:mo>
<mml:mtext>CAL</mml:mtext>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>
<disp-formula id="e2">
<mml:math id="m2">
<mml:mrow>
<mml:mtable columnalign="left">
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:mtext>Medium&#x2009;coarse&#x2009;sandstone</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>576.291</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1.050</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>AC</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>2.129</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>CNL</mml:mtext>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mspace width="11.5em"/>
<mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>308.284</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>DEN</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.179</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>GR</mml:mtext>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mspace width="11.5em"/>
<mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.138</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>RT</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.056</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>CON</mml:mtext>
<mml:mo>_</mml:mo>
<mml:mtext>CAL</mml:mtext>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>
<disp-formula id="e3">
<mml:math id="m3">
<mml:mrow>
<mml:mtable columnalign="left">
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:mtext>Conglomerate</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>584.414</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1.065</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>AC</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>2.055</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>CNL</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>311.549</mml:mn>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mspace width="8em"/>
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>DEN</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.141</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>GR</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.127</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>RT</mml:mtext>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mspace width="8em"/>
<mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.053</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>CON</mml:mtext>
<mml:mo>_</mml:mo>
<mml:mtext>CAL</mml:mtext>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:math>
<label>(3)</label>
</disp-formula>
<disp-formula id="e4">
<mml:math id="m4">
<mml:mrow>
<mml:mtable columnalign="left">
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:mtext>Mudstone</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>596.900</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1.126</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>AC</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>2.224</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>CNL</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>304.854</mml:mn>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:mspace width="6em"/>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>DEN</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.198</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>GR</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.128</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>RT</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.057</mml:mn>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:mspace width="6em"/>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>CON</mml:mtext>
<mml:mo>_</mml:mo>
<mml:mtext>CAL</mml:mtext>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:math>
<label>(4)</label>
</disp-formula>
<disp-formula id="e5">
<mml:math id="m5">
<mml:mrow>
<mml:mtable columnalign="left">
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:mtext>Transitional&#x2009;rocks</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>586.249</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1.078</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>AC</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>2.051</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>CNL</mml:mtext>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:mspace width="9em"/>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>310.230</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>DEN</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.174</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>GR</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.121</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>RT</mml:mtext>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:mspace width="9em"/>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.052</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>CON</mml:mtext>
<mml:mo>_</mml:mo>
<mml:mtext>CAL</mml:mtext>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:math>
<label>(5)</label>
</disp-formula>
<disp-formula id="e6">
<mml:math id="m6">
<mml:mrow>
<mml:mtable columnalign="left">
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:mtext>Dolomite</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>576.476</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1.065</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>AC</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>2.027</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>CNL</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>307.489</mml:mn>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mspace width="5em"/>
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>DEN</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.206</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>GR</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.123</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>RT</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.051</mml:mn>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mspace width="5em"/>
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>CON</mml:mtext>
<mml:mo>_</mml:mo>
<mml:mtext>CAL</mml:mtext>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:math>
<label>(6)</label>
</disp-formula>
</p>
<p>As shown in <xref ref-type="table" rid="T3">Table 3</xref>, the discriminant coincidence rate was determined by comparing the classification results obtained by substituting the observed lithology values into the discriminant function with the original classifications. The lithology codes are indicated in <xref ref-type="table" rid="T3">Table 3</xref> footnote. In this case, the accuracy is 58.2%, indicating that the discriminant analysis method demonstrates limited accuracy in identifying lithology within this study area. The limitations of Bayesian discriminant analysis in lithology identification primarily arise from the following factors. First, the algorithm&#x2019;s underlying assumptions pose significant challenges: it presumes that the data conforms to a specific probability distribution, typically a normal distribution for different categories. However, real-world lithological data often deviates from this assumption, leading to inaccurate classification outcomes. Additionally, the method assumes that all features are independent, a condition rarely met in practice. In lithological datasets, features frequently exhibit interdependencies, and ignoring these correlations can diminish the model&#x2019;s accuracy. Furthermore, Bayesian discriminant analysis struggles with handling the inherent complexity of lithological data, limiting its effectiveness in more intricate classification tasks. When addressing complex lithological types, Bayesian discriminant analysis often fails to capture underlying nonlinear relationships, resulting in suboptimal performance under intricate geological conditions.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Lithology classification result matrix.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Lithology</th>
<th align="center">1</th>
<th align="center">2</th>
<th align="center">3</th>
<th align="center">4</th>
<th align="center">5</th>
<th align="center">6</th>
<th align="center">Total</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">1</td>
<td align="center">95</td>
<td align="center">28</td>
<td align="center">54</td>
<td align="center">43</td>
<td align="center">152</td>
<td align="center">0</td>
<td align="center">372</td>
</tr>
<tr>
<td align="center">2</td>
<td align="center">88</td>
<td align="center">200</td>
<td align="center">29</td>
<td align="center">0</td>
<td align="center">73</td>
<td align="center">18</td>
<td align="center">408</td>
</tr>
<tr>
<td align="center">3</td>
<td align="center">197</td>
<td align="center">6</td>
<td align="center">313</td>
<td align="center">7</td>
<td align="center">292</td>
<td align="center">0</td>
<td align="center">815</td>
</tr>
<tr>
<td align="center">4</td>
<td align="center">12</td>
<td align="center">12</td>
<td align="center">8</td>
<td align="center">546</td>
<td align="center">61</td>
<td align="center">16</td>
<td align="center">655</td>
</tr>
<tr>
<td align="center">5</td>
<td align="center">22</td>
<td align="center">0</td>
<td align="center">38</td>
<td align="center">4</td>
<td align="center">294</td>
<td align="center">0</td>
<td align="center">358</td>
</tr>
<tr>
<td align="center">6</td>
<td align="center">15</td>
<td align="center">2</td>
<td align="center">30</td>
<td align="center">0</td>
<td align="center">58</td>
<td align="center">314</td>
<td align="center">419</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Note: 1-Fine sandstone; 2-Medium coarse sandstone; 3-Conglomerate; 4-Mudstone; 5-Transitional rocks; 6-Dolomite.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3-2">
<title>3.2 Machine learning methods for lithology recognition</title>
<sec id="s3-2-1">
<title>3.2.1 Data preparation</title>
<p>This study used 3,027 sets of logging and core data from 8 core wells in the study area, with 70% of the data for training and 30% for testing. These two datasets serve different functions. The training set is used to build the machine learning models and optimize their hyperparameters, while the testing set is used to evaluate the performance of the trained machine learning models. The lithological labels of 1&#x2013;6 correspond to six main lithologies: fine sandstone, medium to coarse sandstone, conglomerate, mudstone, transitional rocks, and dolomite (<xref ref-type="table" rid="T4">Table 4</xref>).</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Lithology distribution of core samples in the study area.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Lithology</th>
<th align="center">Number of samples</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">Fine sandstone</td>
<td align="center">372</td>
</tr>
<tr>
<td align="center">Medium coarse sandstone</td>
<td align="center">408</td>
</tr>
<tr>
<td align="center">Conglomerate</td>
<td align="center">815</td>
</tr>
<tr>
<td align="center">Mudstone</td>
<td align="center">655</td>
</tr>
<tr>
<td align="center">Transitional rocks</td>
<td align="center">358</td>
</tr>
<tr>
<td align="center">Dolomite</td>
<td align="center">419</td>
</tr>
<tr>
<td align="center">Total</td>
<td align="center">3,027</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The following six conventional logging parameters&#x2014;AC, CNL, DEN, GR, RT, and CON_CAL&#x2014;are selected as sample attribute values. Each sample forms a 7-dimensional vector, comprising six dimensions of parameter values and one dimension for the corresponding lithology label. In machine learning, feature normalization is often essential to eliminate dimensional differences, minimize feature biases, and mitigate the impact of outliers. Normalizing data not only accelerates the training model&#x2019;s convergence but also facilitates reaching the optimal solution more efficiently. The normalization of logging curves maps the values of the curves to [0,1] through linear transformation. It is defined by <xref ref-type="disp-formula" rid="e7">Equation 7</xref>:<disp-formula id="e7">
<mml:math id="m7">
<mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mo>&#x2a;</mml:mo>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>x</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi mathvariant="italic">min</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi mathvariant="italic">max</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi mathvariant="italic">min</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(7)</label>
</disp-formula>
</p>
<p>Among them, <inline-formula id="inf1">
<mml:math id="m8">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi mathvariant="italic">max</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf2">
<mml:math id="m9">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi mathvariant="italic">min</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represent the maximum and minimum values in the set of curve values, respectively. Through this processing method, the normalized logging data values will fall within the [0,1] interval, making them easier to compare and analyze.</p>
<p>Exploratory data analysis is performed by creating correlation matrix diagrams to visualize the relationships between different lithologies and logging parameters. <xref ref-type="fig" rid="F7">Figure 7</xref> presents the correlation matrix diagram illustrating the relationships between various lithologies and logging parameters. The horizontal and vertical axes correspond to six logging parameters, while the diagonal showcases the distribution histograms of different lithologies associated with the parameters on the horizontal axis. Different colors represent various lithologies, and the significant overlap among most logging parameters indicates a lack of clear boundaries, making model classification challenging.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Correlation matrix of different lithology and logging parameters.</p>
</caption>
<graphic xlink:href="feart-13-1491334-g007.tif"/>
</fig>
</sec>
<sec id="s3-2-2">
<title>3.2.2 Model parameter optimization</title>
<p>To obtain the optimal machine learning model, grid search and 5-fold cross validation methods were used to optimize the hyperparameters of RF, SVM, BPNN, and CNN models (<xref ref-type="table" rid="T5">Table 5</xref>). The optimization process for the key parameters is illustrated in <xref ref-type="fig" rid="F8">Figure 8</xref>, while unmentioned parameters are set to default values to enhance the model&#x2019;s accuracy. 5-fold cross-validation provides a reliable estimate of model performance, helps identify optimal parameter settings, and mitigates the risks of overfitting or underfitting. It is widely used for evaluating models and selecting the best parameters, making it suitable for a variety of datasets. The main step of 5-fold cross-validation involves randomly splitting the dataset into five equal parts. Each time, one part is used as the test set, while the remaining four parts serve as the training set. This process is repeated for each part. The optimal parameter combination is then selected based on the highest cross-validation score from the candidate set. After parameter tuning, we optimized the classifier parameters to achieve the best combination (<xref ref-type="table" rid="T5">Table 5</xref>).</p>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Optimum parameter values for each model.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Classifier</th>
<th align="center">Optimal hyperparameter</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">RF</td>
<td align="center">cv folds &#x3d; 5; criterion &#x3d; &#x201c;gini&#x201d;; max depth &#x3d; 29; min leaf size &#x3d; 1; min parent &#x3d; 13; num trees &#x3d; 70</td>
</tr>
<tr>
<td align="center">SVM</td>
<td align="center">cv folds &#x3d; 5; kernel &#x3d; &#x2018;RBF&#x2019;; C &#x3d; 32; gamma &#x3d; 32</td>
</tr>
<tr>
<td align="center">BPNN</td>
<td align="center">hidden layer size range &#x3d; 16; epochs range &#x3d; 1,000; goal range &#x3d; 1e-2<break/>learning rate range &#x3d; 0.01</td>
</tr>
<tr>
<td align="center">CNN</td>
<td align="center">training options &#x3d; &#x201c;adam&#x201d;; max epochs &#x3d; 200; initial learn rate &#x3d; 1e-3<break/>L2 regularization &#x3d; 1e-04; learn rate drop factor &#x3d; 0.5; learn rate drop period &#x3d; 150</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Partial hyperparameter optimization of the machine learning algorithms. <bold>(A)</bold> RF decision tree optimization; <bold>(B)</bold> SVM hyperparameter optimization; <bold>(C)</bold> BPNN mean square error; <bold>(D)</bold> CNN training progress.</p>
</caption>
<graphic xlink:href="feart-13-1491334-g008.tif"/>
</fig>
</sec>
</sec>
<sec id="s3-3">
<title>3.3 Comparison of four machine learning lithology methods</title>
<sec id="s3-3-1">
<title>3.3.1 Evaluation criterion</title>
<p>The performance of the classification models is evaluated using indicators such as accuracy, precision, recall, and F1-score (<xref ref-type="bibr" rid="B48">Zheng et al., 2022</xref>) (<xref ref-type="disp-formula" rid="e8">Equations 8</xref>&#x2013;<xref ref-type="disp-formula" rid="e11">11</xref>). Accuracy represents the proportion of correct predictions (both positive and negative) out of all predictions. Precision measures the proportion of true positives among the samples predicted as positive. Recall refers to the proportion of correctly predicted positive samples among the total actual positives. F1-score is the harmonic mean of precision and recall, which considers both the accuracy of the model in predicting positive samples (precision) and its recognition ability for positive samples (recall). These standard calculation formulas are as follows:<disp-formula id="e8">
<mml:math id="m10">
<mml:mrow>
<mml:mtext>Accuracy</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mtext>TN</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mtext>TN</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mtext>FP</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mtext>FN</mml:mtext>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(8)</label>
</disp-formula>
<disp-formula id="e9">
<mml:math id="m11">
<mml:mrow>
<mml:mtext>Precision</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mtext>FP</mml:mtext>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(9)</label>
</disp-formula>
<disp-formula id="e10">
<mml:math id="m12">
<mml:mrow>
<mml:mtext>Recall</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mtext>FN</mml:mtext>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(10)</label>
</disp-formula>
<disp-formula id="e11">
<mml:math id="m13">
<mml:mrow>
<mml:mtext>F1-score</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#x22c5;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>Precision</mml:mtext>
<mml:mo>&#xd7;</mml:mo>
<mml:mtext>Recall</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>Precision</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mtext>Recall</mml:mtext>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(11)</label>
</disp-formula>
</p>
<p>TP refers to the cases where both the prediction and the actual value are positive. FP refers to the cases where the prediction is positive but the actual value is negative. FN refers to the cases where the prediction is negative but the actual value is positive. TN refers to the cases where both the prediction and the actual value are negative.</p>
</sec>
<sec id="s3-3-2">
<title>3.3.2 Analysis of single point prediction results</title>
<p>After building each machine learning model, the performance of the models is validated and tested. The results are then compared across the four classifiers to evaluate their relative effectiveness (<xref ref-type="fig" rid="F9">Figure 9</xref>). <xref ref-type="fig" rid="F10">Figure 10</xref> shows the comparison of prediction accuracy results among different models. Among them, SVM has the best classification performance, with a prediction accuracy of 93.87% in the training set and 92.72% in the test set. CNN took second place, with a prediction accuracy of 91.50% for the training set and 90.98% for the test set. The prediction accuracy of the RF training set is 90.33%, and the prediction accuracy of the test set is 89.65%. BPNN has the lowest accuracy, with a prediction accuracy of 86.08% for the training set and 85.01% for the test set. From the above, each machine learning classifier constructed has a high prediction accuracy, with an accuracy rate above 85%. SVM has the best classification performance, with a prediction accuracy rate of up to 93%. The confusion matrices (<xref ref-type="fig" rid="F11">Figure 11</xref>) reveal the misclassification patterns of lithology classes for each model, emphasizing which classes are mistakenly predicted as others. In addition, RF can be used to explain the importance of different parameters in various classification and regression models for model prediction results. The importance ranking of logging parameters for lithology identification based on RF is: GR, AC, RT, CON_CAL, CNL, DEN (<xref ref-type="fig" rid="F12">Figure 12</xref>).</p>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Prediction results of each machine learning classifier. <bold>(A)</bold> RF training set test results; <bold>(B)</bold> RF testing set test results; <bold>(C)</bold> SVM training set test results; <bold>(D)</bold> SVM testing set test results; <bold>(E)</bold> BPNN training set test results; <bold>(F)</bold> BPNN testing set test results; <bold>(G)</bold> CNN training set test results; <bold>(H)</bold> CNN testing set test results.</p>
</caption>
<graphic xlink:href="feart-13-1491334-g009.tif"/>
</fig>
<fig id="F10" position="float">
<label>FIGURE 10</label>
<caption>
<p>Comparison of prediction accuracy of four machine learning models.</p>
</caption>
<graphic xlink:href="feart-13-1491334-g010.tif"/>
</fig>
<fig id="F11" position="float">
<label>FIGURE 11</label>
<caption>
<p>Confusion matrix of each machine learning classifier. <bold>(A)</bold> RF training set confusion matrix; <bold>(B)</bold> RF testing set confusion matrix; <bold>(C)</bold> SVM training set confusion matrix; <bold>(D)</bold> SVM testing set confusion matrix; <bold>(E)</bold> BPNN training set confusion matrix; <bold>(F)</bold> BPNN testing set confusion matrix; <bold>(G)</bold> CNN training set confusion matrix; <bold>(H)</bold> CNN testing set confusion matrix.</p>
</caption>
<graphic xlink:href="feart-13-1491334-g011.tif"/>
</fig>
<fig id="F12" position="float">
<label>FIGURE 12</label>
<caption>
<p>Analysis of the importance of logging parameters in RF classifier.</p>
</caption>
<graphic xlink:href="feart-13-1491334-g012.tif"/>
</fig>
<p><xref ref-type="fig" rid="F13">Figure 13</xref> compares the average precision (<xref ref-type="fig" rid="F13">Figure 13A</xref>) and average F1-score (<xref ref-type="fig" rid="F13">Figure 13B</xref>) of the different models. It can be observed that the BPNN model has the lowest average precision (84.7%) and F1-score (0.84). The RF model ranks third, with an average precision of 91.2% and an F1-score of 0.89. The CNN model achieves a relatively high average precision of 92.1%, with an F1-score of 0.91. The SVM model delivers the highest performance, with an average precision of 92.7% and an F1-score of 0.92. In summary, SVM has the best lithology recognition performance, followed by CNN, with both F1-scores higher than 0.9, superior to RF and BPNN.</p>
<fig id="F13" position="float">
<label>FIGURE 13</label>
<caption>
<p>Comparison of lithology identification results of different models. <bold>(A)</bold> Average prediction accuracy of different models; <bold>(B)</bold> Average F1-score for different models.</p>
</caption>
<graphic xlink:href="feart-13-1491334-g013.tif"/>
</fig>
<p>As shown in <xref ref-type="table" rid="T6">Table 6</xref>, each model demonstrates varying recognition capabilities for different lithology types. SVM showed the highest average F1-score, reaching 0.92. For SVM, except for transitional rocks, the F1-score of every lithology is 0.92 or higher, and the transitional rocks are mainly misclassified as fine sandstone and medium to coarse sandstone. This could be attributed to the fact that the siltstone class is a non-reservoir in the study area, and the logging response characteristics of fine sandstone and siltstone are quite similar. When classifying lithology, siltstone is assigned to transitional rocks, which reduces the prediction accuracy for transitional rocks. The F1-scores of CNN and RF are second to SVM, with high F1-scores of 0.96 or above for both mudstone and dolomite, and their misclassification patterns are relatively similar. The main misclassifications are that fine sandstone and medium to coarse sandstone are classified as conglomerate, and transitional rocks are classified as sandy conglomerate and fine sandstone. BPNN also has high F1-scores of 0.91 or above for both mudstone and dolomite, and the lowest F1-score of 0.64 for transitional rocks. In summary, the SVM classifier demonstrates the best overall performance in lithology identification and is therefore used for lithology prediction in the study area.</p>
<table-wrap id="T6" position="float">
<label>TABLE 6</label>
<caption>
<p>F1-scores for different lithologies using different models.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Lithology</th>
<th align="center">RF</th>
<th align="center">SVM</th>
<th align="center">BPNN</th>
<th align="center">CNN</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">Fine sandstone</td>
<td align="center">0.77</td>
<td align="center">0.94</td>
<td align="center">0.87</td>
<td align="center">0.82</td>
</tr>
<tr>
<td align="center">Medium to coarse sandstone</td>
<td align="center">0.86</td>
<td align="center">0.96</td>
<td align="center">0.82</td>
<td align="center">0.92</td>
</tr>
<tr>
<td align="center">Conglomerate</td>
<td align="center">0.88</td>
<td align="center">0.92</td>
<td align="center">0.84</td>
<td align="center">0.89</td>
</tr>
<tr>
<td align="center">Mudstone</td>
<td align="center">0.97</td>
<td align="center">0.96</td>
<td align="center">0.95</td>
<td align="center">0.96</td>
</tr>
<tr>
<td align="center">Transitional rocks</td>
<td align="center">0.87</td>
<td align="center">0.78</td>
<td align="center">0.64</td>
<td align="center">0.86</td>
</tr>
<tr>
<td align="center">Dolomite</td>
<td align="center">0.96</td>
<td align="center">0.96</td>
<td align="center">0.91</td>
<td align="center">0.98</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-3-3">
<title>3.3.3 Lithology prediction in the uncored well</title>
<p>We further validated the effectiveness of the SVM classifier in lithology identification using two blind wells (<xref ref-type="fig" rid="F14">Figure 14</xref>). The results show a high consistency between the lithology predicted by the well-trained SVM model and the lithology observed in the cores, indicating that the well-trained SVM model provides reliable lithology predictions for uncored wells.</p>
<fig id="F14" position="float">
<label>FIGURE 14</label>
<caption>
<p>Comparison of core lithology and predicted lithology using the well-trained SVM classifier. <bold>(A)</bold> Tuo 31&#x2013;39 well; <bold>(B)</bold> Tuo 35&#x2013;33 well.</p>
</caption>
<graphic xlink:href="feart-13-1491334-g014.tif"/>
</fig>
</sec>
</sec>
</sec>
<sec sec-type="conclusion" id="s4">
<title>4 Conclusion</title>
<p>The main conclusions drawn in this article are as follows:<list list-type="simple">
<list-item>
<p>1. The cross-plot method is not effective in distinguishing lithology, but can help identify sensitive logging curves. The selected sensitive logging curves are: gamma ray (GR), acoustic transit time (AC), resistivity (RT), conductivity (CON_CAL), compensated neutron (CNL), and density (DEN).</p>
</list-item>
<list-item>
<p>2. Except for Bayes discriminant analysis, all the constructed machine learning classifiers [i.e., random forest (RF), support vector machine (SVM), back propagation neural network (BPNN), and convolutional neural network (CNN)] demonstrate high prediction accuracy, with the accuracy rate exceeding 85%. Among them, SVM classification shows the best performance, achieving a prediction accuracy as high as 93%. Blind well tests have confirmed the reliability of the well-trained SVM model.</p>
</list-item>
<list-item>
<p>3. RF can be used to explain the importance of different input parameters to the prediction results of classification and regression models. The importance ranking of logging parameters for lithology identification in this study is: GR, AC, RT, CON_CAL, CNL, DEN.</p>
</list-item>
</list>
</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/supplementary material; further inquiries can be directed to the corresponding author.</p>
</sec>
<sec sec-type="author-contributions" id="s6">
<title>Author contributions</title>
<p>ZF: Conceptualization, Investigation, Methodology, Resources, Writing&#x2013;original draft, Writing&#x2013;review and editing. CH: Methodology, Supervision, Writing&#x2013;original draft. SJ: Methodology, Supervision, Writing&#x2013;original draft. ML: Data curation, Formal Analysis, Writing&#x2013;original draft. YC: Resources, Validation, Writing&#x2013;original draft. YJ: Investigation, Software, Writing&#x2013;original draft. YL: Data curation, Formal Analysis, Investigation, Writing&#x2013;review and editing. MT: Investigation, Resources, Writing&#x2013;original draft.</p>
</sec>
<sec sec-type="funding-information" id="s7">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. The authors declare that this study received funding from CNPC Science and Technology special Project &#x201c;Research on Greatly Improved Oil recovery Technology in Ultra-high water cut period of medium and high permeability Oilfield&#x201d; (number: 2023ZZ22). The funder was not involved in the study design, collection, analysis, interpretation of data, the writing of this article, or the decision to submit it for publication.</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>Authors ZF, CH, ML, YC, YJ, YL, and MT were employed by PetroChina Liaohe Oilfield Company.</p>
<p>The remaining author declares that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Amari</surname>
<given-names>S. I.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>Backpropagation and stochastic gradient descent method</article-title>. <source>Neurocomputing</source> <volume>5</volume> (<issue>4-5</issue>), <fpage>185</fpage>&#x2013;<lpage>196</lpage>. <pub-id pub-id-type="doi">10.1016/0925-2312(93)90006-O</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Anifowose</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Abdulraheem</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Al-Shuhail</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>A parametric study of machine learning techniques in petroleum reservoir permeability prediction by integrating seismic attributes and wireline data</article-title>. <source>J. Petroleum Sci. Eng.</source> <volume>176</volume>, <fpage>762</fpage>&#x2013;<lpage>774</lpage>. <pub-id pub-id-type="doi">10.1016/j.petrol.2019.01.110</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ashraf</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Anees</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mangi</surname>
<given-names>H. N.</given-names>
</name>
<name>
<surname>Ali</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>A core logging, machine learning and geostatistical modeling interactive approach for subsurface imaging of lenticular geobodies in a clastic depositional system, SE Pakistan</article-title>. <source>Nat. Resour. Res.</source> <volume>30</volume>, <fpage>2807</fpage>&#x2013;<lpage>2830</lpage>. <pub-id pub-id-type="doi">10.1007/s11053-021-09849-x</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bhattacharya</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Carr</surname>
<given-names>T. R.</given-names>
</name>
<name>
<surname>Pal</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Comparison of supervised and unsupervised approaches for mudstone lithofacies classification: case studies from the Bakken and Mahantango-Marcellus Shale, USA</article-title>. <source>J. Nat. Gas Sci. Eng.</source> <volume>33</volume>, <fpage>1119</fpage>&#x2013;<lpage>1133</lpage>. <pub-id pub-id-type="doi">10.1016/j.jngse.2016.04.055</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Biau</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Scornet</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>A random forest guided tour</article-title>. <source>Test</source> <volume>25</volume>, <fpage>197</fpage>&#x2013;<lpage>227</lpage>. <pub-id pub-id-type="doi">10.1007/s11749-016-0481-7</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Random forests</article-title>. <source>Mach. Learn.</source> <volume>45</volume>, <fpage>5</fpage>&#x2013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1023/a:1010933404324</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bressan</surname>
<given-names>T. S.</given-names>
</name>
<name>
<surname>de Souza</surname>
<given-names>M. K.</given-names>
</name>
<name>
<surname>Girelli</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Junior</surname>
<given-names>F. C.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Evaluation of machine learning methods for lithology classification using geophysical data</article-title>. <source>Comput. and Geosciences</source> <volume>139</volume>, <fpage>104475</fpage>. <pub-id pub-id-type="doi">10.1016/j.cageo.2020.104475</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Guestrin</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2016</year>). &#x201c;<article-title>XGBoost: a scalable tree boosting system</article-title>,&#x201d; in <source>Proceedings of the 22nd ACM SIGKDD international conference on knowledge discovery and data mining</source>.</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cohn</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Ghahramani</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Jordan</surname>
<given-names>M. I.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>Active learning with statistical models</article-title>. <source>J. Artif. Intell. Res.</source> <volume>4</volume>, <fpage>129</fpage>&#x2013;<lpage>145</lpage>. <pub-id pub-id-type="doi">10.1613/jair.295</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cui</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Danyushevsky</surname>
<given-names>L. V.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Determining the ore-forming processes of Dongshengmiao Zn-Pb-Cu deposit: evidence from the linear discriminant analysis of pyrite geochemistry</article-title>. <source>Ore Geol. Rev.</source> <volume>163</volume>, <fpage>105782</fpage>. <pub-id pub-id-type="doi">10.1016/j.oregeorev.2023.105782</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Delfiner</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Peyret</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Serra</surname>
<given-names>O.</given-names>
</name>
</person-group> (<year>1987</year>). <article-title>Automatic determination of lithology from well logs</article-title>. <source>SPE Form. Eval.</source> <volume>2</volume> (<issue>03</issue>), <fpage>303</fpage>&#x2013;<lpage>310</lpage>. <pub-id pub-id-type="doi">10.2118/13290-PA</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dong</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zeng</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Lithology identification using kernel Fisher discriminant analysis with well logs</article-title>. <source>J. Petroleum Sci. Eng.</source> <volume>143</volume>, <fpage>95</fpage>&#x2013;<lpage>102</lpage>. <pub-id pub-id-type="doi">10.1016/j.petrol.2016.02.017</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dong</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zeng</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Lithofacies identification in carbonate reservoirs by multiple kernel Fisher discriminant analysis using conventional well logs: a case study in A oilfield, Zagros Basin, Iraq</article-title>. <source>J. Petroleum Sci. Eng.</source> <volume>210</volume>, <fpage>110081</fpage>. <pub-id pub-id-type="doi">10.1016/j.petrol.2021.110081</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dong</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Su</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Combining the back propagation neural network and particle swarm optimization algorithm for lithological mapping in North China</article-title>. <source>Remote Sens.</source> <volume>15</volume> (<issue>17</issue>), <fpage>4134</fpage>. <pub-id pub-id-type="doi">10.3390/rs15174134</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ehsan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>An integrated approach for the identification of lithofacies and clay mineralogy through Neuro-Fuzzy, cross plot, and statistical analyses, from well log data</article-title>. <source>J. Earth Syst. Sci.</source> <volume>129</volume>, <fpage>101</fpage>&#x2013;<lpage>113</lpage>. <pub-id pub-id-type="doi">10.1007/s12040-020-1365-5</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Goodfellow</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Bengio</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Courville</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2016</year>). <source>Deep learning</source>. <publisher-name>The MIT Press</publisher-name>.</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Helm</surname>
<given-names>H. S.</given-names>
</name>
<name>
<surname>Basu</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Athreya</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Vogelstein</surname>
<given-names>J. T.</given-names>
</name>
<name>
<surname>Priebe</surname>
<given-names>C. E.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Distance-based positive and unlabeled learning for ranking</article-title>. <source>Pattern Recognit.</source> <volume>134</volume>, <fpage>109085</fpage>. <pub-id pub-id-type="doi">10.1016/j.patcog.2022.109085</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Ye</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xiong</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Lau</surname>
<given-names>R. Y.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Time series k-means: a new k-means type smooth subspace clustering for time series data</article-title>. <source>Inf. Sci.</source> <volume>367</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1016/j.ins.2016.05.040</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>GBRTVis: online analysis of gradient boosting regression tree</article-title>. <source>J. Vis.</source> <volume>22</volume>, <fpage>125</fpage>&#x2013;<lpage>140</lpage>. <pub-id pub-id-type="doi">10.1007/s12650-018-0514-2</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jordan</surname>
<given-names>M. I.</given-names>
</name>
<name>
<surname>Mitchell</surname>
<given-names>T. M.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Machine learning: trends, perspectives, and prospects</article-title>. <source>Science</source> <volume>349</volume> (<issue>6245</issue>), <fpage>255</fpage>&#x2013;<lpage>260</lpage>. <pub-id pub-id-type="doi">10.1126/science.aaa8415</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kampffmeyer</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>L&#xf8;kse</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bianchi</surname>
<given-names>F. M.</given-names>
</name>
<name>
<surname>Jenssen</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Livi</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>The deep kernelized autoencoder</article-title>. <source>Appl. Soft Comput.</source> <volume>71</volume>, <fpage>816</fpage>&#x2013;<lpage>825</lpage>. <pub-id pub-id-type="doi">10.1016/j.asoc.2018.07.029</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Le</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Borji</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>What are the receptive, effective receptive, and projective fields of neurons in convolutional neural networks?</article-title> <source>arXiv Prepr. arXiv 1705.07049</source>. <pub-id pub-id-type="doi">10.48550/arXiv.1705.07049</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Research progress on evaluation methods and factors influencing shale brittleness: a review</article-title>. <source>Energy Rep.</source> <volume>8</volume>, <fpage>4344</fpage>&#x2013;<lpage>4358</lpage>. <pub-id pub-id-type="doi">10.1016/j.egyr.2022.03.120</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Radwan</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>J. T.</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>Q. R.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Quantitative analysis of pore complexity in lacustrine organic-rich shale and comparison to marine shale: insights from experimental tests and fractal theory</article-title>. <source>Energy Fuels</source> <volume>38</volume> (<issue>17</issue>), <fpage>16171</fpage>&#x2013;<lpage>16188</lpage>. <pub-id pub-id-type="doi">10.1021/acs.energyfuels.4c03095</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Mou</surname>
<given-names>X. Y.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>H. X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X. X.</given-names>
</name>
<name>
<surname>An</surname>
<given-names>H. Y.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Pore structure and fractal characteristics of the marine shale of the Longmaxi Formation in the Changning area, southern Sichuan basin, China</article-title>. <source>Front. Earth Sci.</source> <volume>10</volume>, <fpage>1018274</fpage>. <pub-id pub-id-type="doi">10.3389/feart.2022.1018274</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Automatic lithology identification by applying LSTM to logging data: a case study in X tight rock reservoirs</article-title>. <source>IEEE Geoscience Remote Sens. Lett.</source> <volume>18</volume> (<issue>8</issue>), <fpage>1361</fpage>&#x2013;<lpage>1365</lpage>. <pub-id pub-id-type="doi">10.1109/LGRS.2020.3001282</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Madani</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Arnaout</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Mofrad</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Arnaout</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Fast and accurate view classification of echocardiograms using deep learning</article-title>. <source>NPJ Digit. Med.</source> <volume>1</volume> (<issue>1</issue>), <fpage>6</fpage>. <pub-id pub-id-type="doi">10.1038/s41746-017-0013-1</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>McDowell</surname>
<given-names>G. M.</given-names>
</name>
<name>
<surname>King</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lewis</surname>
<given-names>R. E.</given-names>
</name>
<name>
<surname>Clayton</surname>
<given-names>E. A.</given-names>
</name>
<name>
<surname>Grau</surname>
<given-names>J. A.</given-names>
</name>
</person-group> (<year>1998</year>). &#x201c;<article-title>In-situ nickel assay by prompt gamma neutron activation wireline logging</article-title>,&#x201d; in <source>SEG Annual Meeting</source> (<publisher-loc>New Orleans, Louisiana</publisher-loc>: <publisher-name>Society of Exploration Geophysicists</publisher-name>), <fpage>772</fpage>&#x2013;<lpage>775</lpage>. <pub-id pub-id-type="doi">10.1190/1.1820589</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Miclea</surname>
<given-names>A. V.</given-names>
</name>
<name>
<surname>Terebes</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Meza</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2020</year>). &#x201c;<article-title>One dimensional convolutional neural networks and local binary patterns for hyperspectral image classification</article-title>,&#x201d; in <conf-name>2020 IEEE International Conference on Automation, Quality and Testing, Robotics (AQTR)</conf-name>, <conf-loc>Cluj-Napoca, Romania</conf-loc>, <conf-date>21-23 May 2020</conf-date>, <fpage>1</fpage>&#x2013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1109/AQTR49680.2020.9129920</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Miyahara</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Aihara</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Lechner</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Quantum expectation-maximization algorithm</article-title>. <source>Phys. Rev. A</source> <volume>101</volume> (<issue>1</issue>), <fpage>012326</fpage>. <pub-id pub-id-type="doi">10.1103/PhysRevA.101.012326</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peng</surname>
<given-names>Y. Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y. F.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>P. R.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>M. C.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Mechanical properties of coal and rock with different dip angles based on true triaxial unloading test</article-title>. <source>J. Min. Strata Control Eng.</source> <volume>6</volume> (<issue>2</issue>), <fpage>023037</fpage>. <pub-id pub-id-type="doi">10.13532/j.jmsce.cn10-1638/td.20231222.001</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rumelhart</surname>
<given-names>D. E.</given-names>
</name>
<name>
<surname>Hinton</surname>
<given-names>G. E.</given-names>
</name>
<name>
<surname>Williams</surname>
<given-names>R. J.</given-names>
</name>
</person-group> (<year>1986</year>). <article-title>Learning representations by back-propagating errors</article-title>. <source>Nature</source> <volume>323</volume> (<issue>6088</issue>), <fpage>533</fpage>&#x2013;<lpage>536</lpage>. <pub-id pub-id-type="doi">10.1038/323533a0</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sanyal</surname>
<given-names>S. K.</given-names>
</name>
<name>
<surname>Juprasert</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jubasche</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>1980</year>). <article-title>An evaluation of a rhyolite-basalt-volcanic ash sequence from well logs</article-title>. <source>Log. Anal.</source> <volume>21</volume> (<issue>1</issue>), <fpage>3</fpage>&#x2013;<lpage>9</lpage>.</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Saporetti</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>da Fonseca</surname>
<given-names>L. G.</given-names>
</name>
<name>
<surname>Pereira</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>de Oliveira</surname>
<given-names>L. C.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Machine learning approaches for petrographic classification of carbonate-siliciclastic rocks using well logs and textural information</article-title>. <source>J. Appl. Geophys.</source> <volume>155</volume>, <fpage>217</fpage>&#x2013;<lpage>225</lpage>. <pub-id pub-id-type="doi">10.1016/j.jappgeo.2018.06.012</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shan</surname>
<given-names>S. C.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Y. Z.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>Y. K.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>P. H.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Shear mechanical properties of anchored rock mass under impact load</article-title>. <source>J. Min. Strata Control Eng.</source> <volume>3</volume> (<issue>4</issue>), <fpage>043034</fpage>. <pub-id pub-id-type="doi">10.13532/j.jmsce.cn10-1638/td.20211014.001</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Optimization of models for a rapid identification of lithology while drilling-A win-win strategy based on machine learning</article-title>. <source>J. Petroleum Sci. Eng.</source> <volume>176</volume>, <fpage>321</fpage>&#x2013;<lpage>341</lpage>. <pub-id pub-id-type="doi">10.1016/j.petrol.2019.01.006</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tian</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Omre</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Inversion of well logs into lithology classes accounting for spatial dependencies by using hidden markov models and recurrent neural networks</article-title>. <source>J. Petroleum Sci. Eng.</source> <volume>196</volume>, <fpage>107598</fpage>. <pub-id pub-id-type="doi">10.1016/j.petrol.2020.107598</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vichi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Cavicchia</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Groenen</surname>
<given-names>P. J.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Hierarchical means clustering</article-title>. <source>J. Classif.</source> <volume>39</volume> (<issue>3</issue>), <fpage>553</fpage>&#x2013;<lpage>577</lpage>. <pub-id pub-id-type="doi">10.1007/s00357-022-09419-7</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>A. X.</given-names>
</name>
<name>
<surname>Chukova</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Nguyen</surname>
<given-names>B. P.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Ensemble k-nearest neighbors based on centroid displacement</article-title>. <source>Inf. Sci.</source> <volume>629</volume>, <fpage>313</fpage>&#x2013;<lpage>323</lpage>. <pub-id pub-id-type="doi">10.1016/j.ins.2023.02.004</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Carr</surname>
<given-names>T. R.</given-names>
</name>
<name>
<surname>Ju</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Identifying organic-rich Marcellus Shale lithofacies by support vector machine classifier in the Appalachian basin</article-title>. <source>Comput. Geosci.</source> <volume>64</volume>, <fpage>52</fpage>&#x2013;<lpage>60</lpage>. <pub-id pub-id-type="doi">10.1016/j.cageo.2013.12.002</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X. L.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Seepage characteristic and fracture development of protected seam caused by mining protecting strata</article-title>. <source>J. Min. Strata Control Eng.</source> <volume>3</volume> (<issue>3</issue>), <fpage>033511</fpage>. <pub-id pub-id-type="doi">10.13532/j.jmsce.cn10-1638/td.20201215.001</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>An improved method for lithology identification based on a hidden Markov model and random forests</article-title>. <source>Geophysics</source> <volume>85</volume> (<issue>6</issue>), <fpage>IM27</fpage>&#x2013;<lpage>IM36</lpage>. <pub-id pub-id-type="doi">10.1190/geo2020-0108.1</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2021a</year>). <article-title>Semi-supervised active learning algorithm for SVMs based on QBC and tri-training</article-title>. <source>J. Ambient Intell. Humaniz. Comput.</source> <volume>12</volume>, <fpage>8809</fpage>&#x2013;<lpage>8822</lpage>. <pub-id pub-id-type="doi">10.1007/s12652-020-02665-w</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2021b</year>). <article-title>Deep learning of rock images for intelligent lithology identification</article-title>. <source>Comput. Geosci.</source> <volume>154</volume>, <fpage>104799</fpage>. <pub-id pub-id-type="doi">10.1016/j.cageo.2021.104799</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yan</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>S. H.</given-names>
</name>
<name>
<surname>Hou</surname>
<given-names>Z. K.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>J. Y.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>A real-time intelligent lithology identification method based on a dynamic felling strategy weighted random forest algorithm</article-title>. <source>Petroleum Sci.</source> <volume>21</volume> (<issue>2</issue>), <fpage>1135</fpage>&#x2013;<lpage>1148</lpage>. <pub-id pub-id-type="doi">10.1016/j.petsci.2023.09.011</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>A safe screening rule for Laplacian support vector machine</article-title>. <source>Eng. Appl. Artif. Intell.</source> <volume>67</volume>, <fpage>309</fpage>&#x2013;<lpage>316</lpage>. <pub-id pub-id-type="doi">10.1016/j.engappai.2017.10.011</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Lithology identification technology of logging data based on deep learning model</article-title>. <source>Earth Sci. Inf.</source> <volume>16</volume> (<issue>3</issue>), <fpage>2545</fpage>&#x2013;<lpage>2557</lpage>. <pub-id pub-id-type="doi">10.1007/s12145-023-01051-2</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zheng</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hou</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Qi</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>Q.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Application of machine learning in the identification of fluvial-lacustrine lithofacies from well logs: a case study from Sichuan Basin, China</article-title>. <source>J. Petroleum Sci. Eng.</source> <volume>215</volume>, <fpage>110610</fpage>. <pub-id pub-id-type="doi">10.1016/j.petrol.2022.110610</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhong</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Carr</surname>
<given-names>T. R.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Application of a convolutional neural network in permeability prediction: a case study in the Jacksonburg-Stringtown oil field, West Virginia, USA</article-title>. <source>Geophysics</source> <volume>84</volume> (<issue>6</issue>), <fpage>B363</fpage>&#x2013;<lpage>B373</lpage>. <pub-id pub-id-type="doi">10.1190/geo2018-0588.1</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A gradient boosting decision tree algorithm combining synthetic minority oversampling technique for lithology identification</article-title>. <source>Geophysics</source> <volume>85</volume> (<issue>4</issue>), <fpage>WA147</fpage>&#x2013;<lpage>WA158</lpage>. <pub-id pub-id-type="doi">10.1190/geo2019-0429.1</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Reservoir characteristics and main controlling factors of the fourth member of Shahejie Formation in Niuxintuo area of western Liaohe sag</article-title>. <source>Special Oil and Gas Reservoirs</source> <volume>29</volume> (<issue>5</issue>), <fpage>49</fpage>. <comment>(in Chinese with an English abstract)</comment>. <pub-id pub-id-type="doi">10.3969/j.issn.1006-6535.2022.05.007</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>