<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Earth Sci.</journal-id>
<journal-title>Frontiers in Earth Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Earth Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-6463</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1608468</article-id>
<article-id pub-id-type="doi">10.3389/feart.2025.1608468</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Earth Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Interpretable machine learning approach for TBM tunnel crown convergence prediction with Bayesian optimization</article-title>
<alt-title alt-title-type="left-running-head">Hu et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/feart.2025.1608468">10.3389/feart.2025.1608468</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Hu</surname>
<given-names>Wanrui</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2998031/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wu</surname>
<given-names>Kai</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Heng</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Luo</surname>
<given-names>Weibang</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Xingxing</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Guan</surname>
<given-names>Peng</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2726862/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>CISPDR Corporation</institution>, <addr-line>Wuhan</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Hubei Shenlong Geological Engineering Investigation Institute Co., Ltd.</institution>, <addr-line>Wuhan</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Faculty of Engineering</institution>, <institution>China University of Geosciences</institution>, <addr-line>Wuhan</addr-line>, <country>China</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Xinjiang Survey and Design Institute for Water Resources and Hydropower</institution>, <institution>Engineering Economics Institute</institution>, <addr-line>Urumqi</addr-line>, <country>China</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Xinjiang Water Conservancy Development and Construction Group Co., Ltd.</institution>, <addr-line>Urumqi</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/168603/overview">Chong Xu</ext-link>, Ministry of Emergency Management (China), China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3037770/overview">You Zhang</ext-link>, China University of Geosciences (Wu Han), China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3054938/overview">Zhiyuan Xia</ext-link>, Kunming University of Science and Technology, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3072608/overview">Zida Liu</ext-link>, Central South University, China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Peng Guan, <email>20081002141@cug.edu.cn</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>30</day>
<month>06</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>13</volume>
<elocation-id>1608468</elocation-id>
<history>
<date date-type="received">
<day>09</day>
<month>04</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>12</day>
<month>06</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Hu, Wu, Liu, Luo, Li and Guan.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Hu, Wu, Liu, Luo, Li and Guan</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Accurate prediction of crown convergence in Tunnel Boring Machine (TBM) tunnels is critical for ensuring construction safety, optimizing support design, and improving construction efficiency. This study proposes an interpretable machine learning method based on Bayesian optimization (BO) and SHapley Additive exPlanations (SHAP) for predicting crown convergence (CC) in TBM tunnels. Firstly, a dataset comprising 1,501 samples was constructed using tunnel engineering data. Then, six classical ML models, namely, Support Vector Regression, Decision Tree, Random Forest, Light Gradient Boosting Machine (LightGBM), eXtreme Gradient Boosting, and K-nearest neighbors&#x2014;were developed, and BO was applied to tune the hyperparameters of each model to achieve accurate prediction of CC. Subsequently, the SHAP method was adopted to interpret the LightGBM model, quantifying the contribution of each input feature to the model&#x2019;s predictions. The results indicate that the LightGBM model achieved the best prediction performance on the test set, with root mean squared error, mean absolute error, mean absolute percentage error, and determination coefficient values of 0.9122 mm, 0.6027 mm, 0.0644, and 0.9636, respectively; the average SHAP values for the six input features of the LightGBM model were ranked as follows: Time (0.1366) &#x3e; Rock grade (0.0871) &#x3e; Depth ratio (0.0528) &#x3e; Still arch (0.0200) &#x3e; Saturated compressive strength (0.0093) &#x3e; Rock quality designation (0.0047). Validation using data from a TBM water conveyance tunnel in Xinjiang, China, confirmed the method&#x2019;s practical utility, positioning it as an effective auxiliary tool for safer and more efficient TBM tunnel construction.</p>
</abstract>
<kwd-group>
<kwd>TBM tunnel</kwd>
<kwd>crown convergence prediction</kwd>
<kwd>machine learning</kwd>
<kwd>model explanation</kwd>
<kwd>bayesian optimization</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Geohazards and Georisks</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Tunnel Boring Machines (TBMs) are highly efficient and automated excavation equipment widely used in urban subways, hydraulic engineering, and transportation tunnels (<xref ref-type="bibr" rid="B18">Gao et al., 2021</xref>; <xref ref-type="bibr" rid="B16">Fu et al., 2023</xref>; <xref ref-type="bibr" rid="B50">Zhang et al., 2024</xref>). However, the deformation of surrounding rock during TBM construction remains a critical concern in the engineering community (<xref ref-type="bibr" rid="B34">Mahdevari et al., 2012</xref>). Crown convergence (CC) is a key indicator of tunnel stability, and excessive settlement can not only compromise the structural safety of the tunnel but also lead to construction delays and increased costs (<xref ref-type="bibr" rid="B14">Feng et al., 2019</xref>). Therefore, accurate prediction of crown convergence in TBM tunnels is crucial for ensuring construction safety, optimizing support design, and improving construction efficiency (<xref ref-type="bibr" rid="B3">Adoko and Wu, 2012</xref>).</p>
<p>Traditional methods for predicting tunnel convergence predominantly rely on empirical formulas and numerical simulations. For instance, Arora et al. (<xref ref-type="bibr" rid="B7">Arora and Gutierrez, 2021</xref>) presents a visco-elastic-plastic solution for deep circular tunnel under squeezing conditions, which can be used to determine the viscous behavior of tunnel wall convergence with time. <xref ref-type="bibr" rid="B8">Asadollahpour et al. (2014)</xref> determined the closure parameters of Panet Equation associated with face advance and time effect of a rock tunnel in six different monitoring stations. <xref ref-type="bibr" rid="B21">Huang et al. (2017)</xref> introduces a detailed numerical simulation to reveal the probabilistic response of tunnel convergence in spatial verified soils. <xref ref-type="bibr" rid="B11">Chen et al. (2018)</xref> proposed a case study on the stress and deformation characteristics of tunnels induced by close distance earth pressure balance shield under-crossing in sandy soil stratum. Empirical formulas are often based on limited engineering data and may not accurately reflect the deformation behavior of surrounding rock under complex geological conditions (<xref ref-type="bibr" rid="B47">Wang et al., 2021</xref>). Numerical simulations, despite their ability to model multi-factor interactions, are constrained by high computational costs and parameter sensitivity, hindering real-time engineering applications (<xref ref-type="bibr" rid="B20">Hu et al., 2024</xref>). With the rapid development of machine learning (ML) techniques, data-driven approaches have emerged as effective tools for solving complex engineering problems (<xref ref-type="bibr" rid="B9">Bo et al., 2023</xref>). ML methods can learn complex nonlinear relationships from large amounts of historical data, providing more accurate predictions. In recent years, ML methods have been widely applied in underground engineering due to their excellent feature analysis capabilities (<xref ref-type="bibr" rid="B35">Mahmoodzadeh et al., 2021</xref>; <xref ref-type="bibr" rid="B41">Ray et al., 2021</xref>; <xref ref-type="bibr" rid="B23">Kim et al., 2022</xref>; <xref ref-type="bibr" rid="B48">Xu et al., 2022</xref>; <xref ref-type="bibr" rid="B52">Zhang et al., 2022</xref>).</p>
<p>In the field of tunnel engineering, numerous studies have attempted to predict tunnel convergence using ML methods. For example, <xref ref-type="bibr" rid="B3">Adoko and Wu (2012)</xref> used an Adaptive Neuro-Fuzzy Inference System (ANFIS) to predict tunnel convergence, achieving satisfactory results. <xref ref-type="bibr" rid="B33">Mahdevari and Torabi (2012)</xref> employed an Artificial Neural Network (ANN) model to predict tunnel deformation, demonstrating that ANN models can achieve high prediction accuracy under complex geological conditions. <xref ref-type="bibr" rid="B39">Pan et al. (2012)</xref> combined the Firefly Algorithm (FA) with a Nonlinear Auto-Regressive (NAR) dynamic neural network to construct a dynamic nonlinear model for predicting surrounding rock convergence. <xref ref-type="bibr" rid="B36">Mahmoodzadeh et al. (2022)</xref> developed 5 ML models&#x2014;Deep Neural Network (DNN), Gaussian Process Regression (GPR), K-Nearest Neighbors (KNN), Decision Tree (DT), and Support Vector Regression (SVR)&#x2014;to accurately predict tunnel convergence. <xref ref-type="bibr" rid="B55">Zhou J. et al. (2023)</xref> collected 142 samples of highway tunnel deformation data and constructed six reliable ML models to predict tunnel convergence, using the Jellyfish Search Optimizer (JSO) for hyperparameter tuning. <xref ref-type="bibr" rid="B43">Sheini Dashtgoli et al. (2024)</xref> used FLAC 3D to create a dataset of 954 samples from shallow-buried tunnels and developed five tree-based ML algorithms to accurately predict the maximum convergence of unsupported shallow tunnels. <xref ref-type="bibr" rid="B6">An et al. (2024b)</xref> collected tunnel convergence data to build a dataset and used KNN, SVR, DT, RF, Extreme Gradient Boosting (XGBoost), Categorical Boosting (CatBoost), and Automated ML models to accurately predict tunnel convergence, and evaluated tunnel stability based on the prediction results in actual tunnel projects.</p>
<p>Despite the progress made in tunnel convergence prediction, several limitations still remain. Firstly, most studies focus solely on model prediction accuracy, neglecting model interpretability. The &#x201c;black-box&#x201d; nature of ML models makes their internal decision-making mechanisms difficult to understand, thus limiting their practical application in engineering (<xref ref-type="bibr" rid="B1">Adadi and Berrada, 2018</xref>; <xref ref-type="bibr" rid="B38">Naser, 2021</xref>). Secondly, many studies rely on limited datasets, which may not fully capture the deformation behavior of surrounding rock under complex geological conditions. Thirdly, the intelligent convergence prediction of TBM tunnels is very limited so far. SHapley Additive exPlanations (SHAP) is an explanation technique for ML models, which has been widely used in tunnel issues, such as explanation of tunnelling induced surface settlement prediction model (<xref ref-type="bibr" rid="B24">Li and Dias, 2024</xref>), tunnel squeezing prediction model (<xref ref-type="bibr" rid="B9">Bo et al., 2023</xref>), and tunnel convergence prediction model (<xref ref-type="bibr" rid="B6">An et al., 2024b</xref>). To address these issues, this study proposes a ML method based on Bayesian Optimization (BO) and SHAP for predicting crown convergence in TBM tunnels considering the successful application of SHAP in tunnel issues. A set of six classical ML models (SVM, DT, RF, LightGBM, XGBoost, and KNN) were adopted for CC prediction in TBM tunnels considering their successful application in tunnel issues (<xref ref-type="bibr" rid="B55">Zhou J. et al., 2023</xref>; <xref ref-type="bibr" rid="B6">An et al., 2024b</xref>; <xref ref-type="bibr" rid="B19">Guan et al., 2025</xref>). At the beginning, six input features were selected from geological, design, and time factors to construct a dataset containing 1,501 samples. Then, BO was adopted to tune the hyperparameters of six classical ML models (SVR, DT, RF, LightGBM, XGBoost, and KNN) to improve their prediction performance. Finally, the SHAP method was used to interpret the optimal model (LightGBM), quantifying the contribution of each input feature to the model&#x2019;s predictions. The novelties of this research are as follows: (1) It constructs a large-scale dataset with 1,501 samples, covering the deformation behavior of surrounding rock under complex geological conditions, which offers a solid data foundation for model training and testing. (2) It employs six classical ML models (SVR, DT, RF, LightGBM, XGBoost, and KNN) for CC prediction and uses BO to optimize the hyperparameters of each model, thereby improving prediction accuracy and generalization ability. (3) It applies the SHAP method to interpret the optimal model (LightGBM), quantifying the contribution of each input feature to the model&#x2019;s predictions and enhancing model interpretability. (4) The study validates the proposed method using data from a TBM water conveyance tunnel in Xinjiang, China, demonstrating that the approach can serve as an auxiliary tool for promoting safer and more efficient construction of TBM tunnel projects. This study not only helps engineers better understand the mechanisms of tunnel deformation but also provides a scientific basis for tunnel support design and construction decision-making, enabling safer and more efficient tunnel construction processes.</p>
<p>The remainder of this paper is organized as follows: <xref ref-type="sec" rid="s2">Section 2</xref> introduces the TBM tunnel crown convergence dataset constructed in this study; <xref ref-type="sec" rid="s3">Section 3</xref> presents the proposed method for predicting CC; <xref ref-type="sec" rid="s4">Section 4</xref> provides a detailed analysis of the prediction results; <xref ref-type="sec" rid="s5">Section 5</xref> displays the application of the proposed method in tunnel engineering; and <xref ref-type="sec" rid="s6">Section 6</xref> concludes the study and outlines its limitations.</p>
</sec>
<sec id="s2">
<title>2 Database</title>
<p>The selection of input features has a significant impact on the training effectiveness of ML models (<xref ref-type="bibr" rid="B6">An et al., 2024b</xref>). Proper selection of input features can enhance the prediction performance of ML models. In this study, nine input features were selected from geological, design, and time factors, including depth ratio (DR), rock grade (RG), saturated compressive strength (SCS), saturated tensile strength (STS), Rock Quality Designation (RQD), friction angle (FA), cohesion (C), steel arch height (SA), and time (T) since initial support completion. The output of the ML models is the CC of the tunnel. The dataset of this study is available via <ext-link ext-link-type="uri" xlink:href="https://github.com/Unic1124/data">https://github.com/Unic1124/data</ext-link>.</p>
<p>The depth ratio reflects the relationship between the tunnel depth and diameter. A higher depth ratio indicates more complex stress conditions in the surrounding rock, which can affect tunnel deformation (<xref ref-type="bibr" rid="B55">Zhou J. et al., 2023</xref>). The depth ratio is calculated using <xref ref-type="disp-formula" rid="e1">Equation 1</xref>.<disp-formula id="e1">
<mml:math id="m1">
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>D</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>where <italic>R</italic> is depth ratio, <italic>H</italic> is the depth of the tunnel roof, <italic>D</italic> is the diameter of the tunnel.</p>
<p>Geological factors (RG, RQD, FA, C, SCS, and STS) directly reflect the integrity, stability, and strength of the surrounding rock, which are decisive factors in tunnel deformation. The lower the RG, the better the engineering properties of the rock mass, and the higher the stability of the tunnel&#x2019;s surrounding rock, resulting in a relatively lower likelihood of deformation. A higher RQD value implies fewer internal rock fractures, better integrity, and stronger self-stability of the surrounding rock after tunnel excavation, thus limiting the extent of deformation. Greater values of FA and C enhance the rock&#x2019;s shear strength, improving its overall integrity and stability. Rocks with higher SCS and STS can better withstand various stresses generated during tunnel excavation, reducing the likelihood of deformation. Design factors (DR, SA) influence stress distribution and support effectiveness. The steel arch height reflects the stiffness of the initial support. Higher stiffness leads to better support effects and smaller tunnel deformation. A rational steel arch design can effectively disperse the stress of the surrounding rock and mitigate deformation caused by localized stress concentration (<xref ref-type="bibr" rid="B6">An et al., 2024b</xref>). Temporal factor (T) accounts for time-dependent deformation processes. Tunnel deformation is caused by the creep of surrounding rock, especially after the completion of initial support, where the creep effect significantly impacts tunnel stability. Therefore, the time since initial support completion is also an important factor influencing tunnel deformation (<xref ref-type="bibr" rid="B2">Adoko et al., 2013</xref>).</p>
<p>Sample data were extracted from tunnel sections of a TBM water conveyance tunnel in Xinjiang, China, to construct a dataset for model training and validation. Feature information was extracted from geological reports, design materials, construction schemes, and monitoring reports to form a dataset of 1,501 samples. This comprehensive dataset captures diverse geological and engineering conditions, ensuring robust model training. The data encompasses a wide range of geological and engineering conditions, reflecting the complex and diverse nature of TBM tunneling environments. It includes various input features as articulated above, which are critical factors influencing tunnel stability and deformation. The quality of the dataset is ensured through rigorous data cleaning and preprocessing steps, removing any inconsistencies or errors that could affect the ML model&#x2019;s performance. The dataset&#x2019;s representativeness is further validated by its alignment with the actual geological and engineering characteristics of the tunnel, making it a reliable benchmark for evaluating the predictive models.</p>
<p>Feature selection can avoid data redundancy and reduce the computational load of ML models (<xref ref-type="bibr" rid="B6">An et al., 2024b</xref>). Pearson correlation coefficients were calculated for each feature in the dataset using <xref ref-type="disp-formula" rid="e2">Equation 2</xref> to perform feature selection. A correlation coefficient (COR) greater than 0.6 indicates a strong correlation between two variables. As shown in <xref ref-type="fig" rid="F1">Figure 1a</xref>, the COR values between FA and DR, SCS, STS, RQD, and C were &#x2212;0.61, 0.85, 0.73, 0.79, and 0.92, respectively, indicating strong correlations between FA and these five variables. The COR values between C and SCS, RQD, and FA were 0.71, 0.82, and 0.93, respectively, suggesting strong correlations between C and these three features. The COR values between STS and SCS and RQD were 0.77 and 0.61, respectively. Therefore, STS, FA, and C were removed from the input features to avoid computational burden caused by data redundancy. After feature selection, the data distribution and correlations of the input and output features are shown in <xref ref-type="fig" rid="F1">Figures 1b,2</xref>, <xref ref-type="fig" rid="F2"/>, and the statistical characteristics of the dataset are presented in <xref ref-type="table" rid="T1">Table 1</xref>.<disp-formula id="e2">
<mml:math id="m2">
<mml:mrow>
<mml:mi>C</mml:mi>
<mml:mi>O</mml:mi>
<mml:mi>R</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
</mml:mstyle>
<mml:mfrac>
<mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>x</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>x</mml:mi>
<mml:mo>&#x223c;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>y</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x223c;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mi>n</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
<mml:mrow>
<mml:msqrt>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
</mml:mstyle>
<mml:mfrac>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>x</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>x</mml:mi>
<mml:mo>&#x223c;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mrow>
<mml:mi>n</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:msqrt>
<mml:msqrt>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
</mml:mstyle>
<mml:mfrac>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>y</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x223c;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mrow>
<mml:mi>n</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>where <italic>x</italic> and <italic>y</italic> are the values of the two variables, <inline-formula id="inf1">
<mml:math id="m3">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>x</mml:mi>
<mml:mo>&#x223c;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf2">
<mml:math id="m4">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x223c;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> are the means of <italic>x</italic> and <italic>y</italic>, respectively; and <italic>n</italic> is the number of the samples.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>The correlation between the features: <bold>(a)</bold> before feature screening; <bold>(b)</bold> after feature screening.</p>
</caption>
<graphic xlink:href="feart-13-1608468-g001.tif">
<alt-text content-type="machine-generated">Two heatmaps show correlation matrices for different variables. Heatmap (a) includes variables DR, RG, SCS, STS, RQD, FA, C, SA, T, and CC, with color gradients representing correlation values from negative to positive. Heatmap (b) displays a similar matrix with some variables omitted. Both include a color legend on the right, indicating correlation strength from -0.6 (pink) to 1.0 (green).</alt-text>
</graphic>
</fig>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>The distribution of the dataset after screening: <bold>(a)</bold> RG; <bold>(b)</bold> RQD; <bold>(c)</bold> SCS; <bold>(d)</bold> DR; <bold>(e)</bold> SA; <bold>(f)</bold> T; <bold>(g)</bold> CC.</p>
</caption>
<graphic xlink:href="feart-13-1608468-g002.tif">
<alt-text content-type="machine-generated">Seven histograms with cumulative probability plots represent various datasets: (a) RG shows a concentrated count around 3 and 5; (b) RQD peaks at 80; (c) SCS has distinct counts at 60 and 100; (d) DR displays a spread with peaks between 56 and 62; (e) SA has a single peak at 140; (f) T is evenly distributed; (g) CC peaks around 7 to 12. Each graph has dual y-axes for count and cumulative probability.</alt-text>
</graphic>
</fig>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>The statistic characteristic of the dataset.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Statistic characteristic</th>
<th align="center">DR</th>
<th align="center">RG</th>
<th align="center">SCS (MPa)</th>
<th align="center">RQD (%)</th>
<th align="center">SA (mm)</th>
<th align="center">T (day)</th>
<th align="center">CC (mm)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">Count</td>
<td align="center">1,501</td>
<td align="center">1,501</td>
<td align="center">1,501</td>
<td align="center">1,501</td>
<td align="center">1,501</td>
<td align="center">1,501</td>
<td align="center">1,501</td>
</tr>
<tr>
<td align="center">Average</td>
<td align="center">61.45</td>
<td align="center">3.80</td>
<td align="center">72.58</td>
<td align="center">69.28</td>
<td align="center">94.30</td>
<td align="center">11.95</td>
<td align="center">10.89</td>
</tr>
<tr>
<td align="center">Std</td>
<td align="center">4.53</td>
<td align="center">0.85</td>
<td align="center">21.75</td>
<td align="center">16.83</td>
<td align="center">65.01</td>
<td align="center">9.10</td>
<td align="center">4.60</td>
</tr>
<tr>
<td align="center">Minimum</td>
<td align="center">51.78</td>
<td align="center">3</td>
<td align="center">55.00</td>
<td align="center">48.00</td>
<td align="center">0.00</td>
<td align="center">0.50</td>
<td align="center">1.10</td>
</tr>
<tr>
<td align="center">25%</td>
<td align="center">58.49</td>
<td align="center">3</td>
<td align="center">55.00</td>
<td align="center">48.00</td>
<td align="center">0.00</td>
<td align="center">4.50</td>
<td align="center">7.60</td>
</tr>
<tr>
<td align="center">Medium</td>
<td align="center">61.03</td>
<td align="center">4</td>
<td align="center">60.00</td>
<td align="center">70.40</td>
<td align="center">125.00</td>
<td align="center">9.50</td>
<td align="center">10.80</td>
</tr>
<tr>
<td align="center">75%</td>
<td align="center">65.26</td>
<td align="center">5</td>
<td align="center">101.00</td>
<td align="center">81.10</td>
<td align="center">150.00</td>
<td align="center">19.50</td>
<td align="center">14.60</td>
</tr>
<tr>
<td align="center">Maximum</td>
<td align="center">67.82</td>
<td align="center">5</td>
<td align="center">107.00</td>
<td align="center">94.80</td>
<td align="center">150.00</td>
<td align="center">31.50</td>
<td align="center">21.10</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec sec-type="methods" id="s3">
<title>3 Methods</title>
<p>In tunnel engineering, predicting the convergence of the tunnel is a complex issue involving the coupling of multiple factors, and traditional mechanical analysis methods often struggle to accurately capture its nonlinear characteristics. In recent years, ML methods, due to their strong data-driven capabilities and advantages in modeling complex relationships, have gradually become effective tools for solving such problems. This study develops six distinct ML models, which are subsequently trained and tested utilizing a dataset pertaining to TBM tunnel crown convergence. The hyperparameters of these ML models are meticulously optimized through the application of BO. Furthermore, the SHAP method is employed to provide interpretability to the models. The comprehensive workflow of this research is visually depicted in <xref ref-type="fig" rid="F3">Figure 3</xref>.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Workflow of the proposed approach.</p>
</caption>
<graphic xlink:href="feart-13-1608468-g003.tif">
<alt-text content-type="machine-generated">Flowchart of a machine learning process for model development and evaluation. Inputs, RG, RQD, SCS, DR, SA, T, and output CC, are divided into training (80%) and test (20%) sets. Models include SVR, DT, RF, LightGBM, XGBoost, and KNN. Performance is evaluated using RMSE, MAE, MAPE, and R&#xB2;. LightGBM is the optimal model. Model explanation uses Shapley values. Engineering applications show three charts (K63&#x26;&#x23;&#x2b;510, K63&#x26;&#x23;&#x2b;530, K63&#x26;&#x23;&#x2b;550) with model performance metrics.</alt-text>
</graphic>
</fig>
<sec id="s3-1">
<title>3.1 Machine learning algorithms</title>
<sec id="s3-1-1">
<title>3.1.1 Support Vector Regression</title>
<p>The Support Vector Machine (SVM) emerged from the Statistical Learning Theory proposed by Vapnik and colleagues in the 1990s and stands as a robust supervised learning algorithm (<xref ref-type="bibr" rid="B56">Zhou et al., 2022</xref>). Initially conceived for classification tasks, it was subsequently adapted for regression problems through the incorporation of the &#x3b5;-insensitive loss function, giving rise to Support Vector Regression (SVR). In regression problems, SVR seeks to find the optimal regression function (<xref ref-type="disp-formula" rid="e3">Equation 3</xref>) that minimizes the prediction error (<xref ref-type="bibr" rid="B49">Yin et al., 2023</xref>).<disp-formula id="e3">
<mml:math id="m5">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold-italic">x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mi mathvariant="bold-italic">w</mml:mi>
<mml:mi>T</mml:mi>
</mml:msup>
<mml:mi>&#x3d5;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold-italic">x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>b</mml:mi>
</mml:mrow>
</mml:math>
<label>(3)</label>
</disp-formula>where <inline-formula id="inf3">
<mml:math id="m6">
<mml:mrow>
<mml:mi>&#x3d5;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold-italic">x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is the kernel function that maps the input <bold>
<italic>x</italic>
</bold> into a high-dimensional feature space, <bold>
<italic>w</italic>
</bold> is the weight vector and <italic>b</italic> denotes the bias term.</p>
</sec>
<sec id="s3-1-2">
<title>3.1.2 Decision tree</title>
<p>The DT is a tree-based classification and regression model that is widely used in the fields of ML and data mining (<xref ref-type="bibr" rid="B27">Liu et al., 2022</xref>). For regression problems, the objective of the DT is to minimize the MSE for each leaf node. Suppose the input space is partitioned into <italic>M</italic> regions, denoted as <inline-formula id="inf4">
<mml:math id="m7">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mfenced open="{" close="}" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>, where each region corresponds to a leaf node with an output value <italic>c</italic>
<sub>
<italic>m</italic>
</sub>. The prediction of the decision tree can be expressed as <xref ref-type="disp-formula" rid="e4">Equation 4</xref>:<disp-formula id="e4">
<mml:math id="m8">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mo>&#x3d;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>M</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mo>&#xb7;</mml:mo>
<mml:mi>I</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold-italic">x</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(4)</label>
</disp-formula>where <inline-formula id="inf5">
<mml:math id="m9">
<mml:mrow>
<mml:mi>I</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mo>&#xb7;</mml:mo>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is the indicator function that takes a value of one if <bold>
<italic>x</italic>
</bold> belongs to <italic>R</italic>
<sub>
<italic>m</italic>
</sub> and 0 otherwise; <italic>c</italic>
<sub>
<italic>m</italic>
</sub> is typically the mean of the target values of the samples within region <italic>R</italic>
<sub>
<italic>m</italic>
</sub>; and <inline-formula id="inf6">
<mml:math id="m10">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> represents the final prediction value of the decision tree.</p>
</sec>
<sec id="s3-1-3">
<title>3.1.3 Random Forest</title>
<p>RF is an ensemble learning algorithm based on DTs. By constructing multiple DTs and aggregating their predictions, the overall model achieves high prediction accuracy and stability (<xref ref-type="bibr" rid="B53">Zhao et al., 2024</xref>). The work process of RF is depicted in <xref ref-type="fig" rid="F4">Figure 4</xref>. The work process of RF is described by <xref ref-type="disp-formula" rid="e5">Equation 5</xref>.<disp-formula id="e5">
<mml:math id="m11">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>T</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(5)</label>
</disp-formula>where <italic>T</italic> denotes the number of decision trees; <inline-formula id="inf7">
<mml:math id="m12">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> represents the prediction result of the <italic>t</italic>-th DT; and <inline-formula id="inf8">
<mml:math id="m13">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> is the final prediction value of the RF.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Schematic diagram of the RF</p>
</caption>
<graphic xlink:href="feart-13-1608468-g004.tif">
<alt-text content-type="machine-generated">Diagram illustrating the random forest algorithm. Starting with a sample \(S\), the process involves bootstrapping to form samples \(S1, S2, S3, \ldots\). Decision trees are applied to these samples, creating multiple models. Each model outputs a class, resulting in \(K1, K2, \ldots, Kn\). Outputs are aggregated using averaging for regression or voting for classification, leading to a final result or classification.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s3-1-4">
<title>3.1.4 LightGBM</title>
<p>LightGBM is an efficient ML algorithm based on the gradient boosting framework (<xref ref-type="bibr" rid="B9">Bo et al., 2023</xref>). By incorporating techniques such as the Histogram algorithm and Gradient-based One-Sided Sampling, it significantly enhances the training speed and memory efficiency of the model while maintaining high prediction accuracy (<xref ref-type="bibr" rid="B22">Ke et al., 2017</xref>). The principle of LightGBM is based on Gradient Boosting Decision Trees (GBDT), which aims to achieve fast and accurate predictions on high-dimensional data. GBDT iteratively adds new DTs to progressively reduce the loss value of the objective function, as expressed in <xref ref-type="disp-formula" rid="e6">Equation 6</xref>. LightGBM optimizes <xref ref-type="disp-formula" rid="e6">Equation 6</xref> to incrementally improve prediction performance, ultimately achieving precise predictions.<disp-formula id="e6">
<mml:math id="m14">
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:math>
<label>(6)</label>
</disp-formula>where <italic>L</italic> denotes the objective function, <italic>n</italic> is the number of samples, <inline-formula id="inf9">
<mml:math id="m15">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the true value of the <italic>i</italic>-th sample, <inline-formula id="inf10">
<mml:math id="m16">
<mml:mrow>
<mml:msubsup>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> is the predicted value after the <italic>t</italic>-1-th iteration, and <inline-formula id="inf11">
<mml:math id="m17">
<mml:mrow>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is the prediction of the <italic>i</italic>-th sample by the decision tree added in the <italic>t</italic>-th.</p>
<p>LightGBM employs the Histogram algorithm to discretize continuous feature values into multiple bins. Additionally, the introduction of Gradient-based One-Sided Sampling (GOSS) and Exclusive Feature Bundling (EFB) algorithms addresses the issue of excessive sample and feature counts, further optimizing computational efficiency. These optimization techniques endow LightGBM with significant advantages in handling large-scale datasets, making it well-suited for complex data analysis tasks in tunnel crown settlement prediction.</p>
</sec>
<sec id="s3-1-5">
<title>3.1.5 XGBoost</title>
<p>The principle of XGBoost is similar to that of LightGBM and is a gradient boosting-based ensemble learning algorithm. By optimizing the objective function and incorporating regularization terms, XGBoost further enhances the model&#x2019;s generalization ability and prediction accuracy (<xref ref-type="bibr" rid="B12">Chen and Guestrin, 2016</xref>). The XGBoost algorithm constructs DTs sequentially, specifically fitting the residuals between the predictions of the previous tree and the actual values, with the aim of progressively approximating the true values (<xref ref-type="bibr" rid="B44">Tang et al., 2024</xref>). This process continues until a predefined number of iterations is reached or a specific termination condition is satisfied. After training is completed, the model aggregates the predictions from all decision trees using a weighted summation method to generate the final prediction for each sample.</p>
<p>During the optimization of the loss function, XGBoost employs a second-order Taylor expansion to simplify calculations and introduces a regularization term into the objective function to effectively control model complexity and prevent overfitting. The objective function is formulated as <xref ref-type="disp-formula" rid="e7">Equation 7</xref>.<disp-formula id="e7">
<mml:math id="m18">
<mml:mrow>
<mml:mi>O</mml:mi>
<mml:mi>b</mml:mi>
<mml:mi>j</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:mtext>&#x200a;</mml:mtext>
<mml:mi>l</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>K</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:mtext>&#x200a;</mml:mtext>
<mml:mi mathvariant="normal">&#x3a9;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(7)</label>
</disp-formula>where <inline-formula id="inf12">
<mml:math id="m19">
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is the loss function, <inline-formula id="inf13">
<mml:math id="m20">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf14">
<mml:math id="m21">
<mml:mrow>
<mml:msub>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are the true and predicted values of the <italic>i-</italic>th sample, respectively; and <italic>n</italic> is the number of samples. <inline-formula id="inf15">
<mml:math id="m22">
<mml:mrow>
<mml:mi mathvariant="normal">&#x3a9;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is the regularization term, <italic>K</italic> is the number of decision trees, and <inline-formula id="inf16">
<mml:math id="m23">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represents the complexity of the <italic>k</italic>-th tree.</p>
</sec>
<sec id="s3-1-6">
<title>3.1.6 K-nearest neighbors</title>
<p>The KNN algorithm is an instance-based learning method. Its core concept is to predict based on the label information of the <italic>k</italic> nearest neighbors to the input sample, using methods such as voting or weighted averaging (<xref ref-type="bibr" rid="B9">Bo et al., 2023</xref>; <xref ref-type="bibr" rid="B6">An et al., 2024b</xref>).</p>
</sec>
</sec>
<sec id="s3-2">
<title>3.2 Bayesian optimization</title>
<p>Hyperparameters have a significant impact on the predictive performance of ML models. Optimizing the hyperparameters of ML models can enhance their predictive performance (<xref ref-type="bibr" rid="B10">Chen and Seo, 2023</xref>). BO is an efficient global optimization method suitable for scenarios where the objective function is non-analytical, computationally expensive, or noisy (<xref ref-type="bibr" rid="B51">Zhang et al., 2020</xref>). It can address the limitations of grid search, which has a large computational burden, and random search, which is prone to getting stuck in local optima. BO constructs probabilistic models, such as Gaussian processes, to predict the behavior of the objective function and uses acquisition functions, such as expected improvement and upper confidence bound, to balance exploration and exploitation (<xref ref-type="bibr" rid="B15">Frazier, 2018</xref>). By doing so, BO can intelligently select evaluation points and iteratively approach the optimal solution. Its core idea is to update the posterior distribution using prior knowledge, thereby guiding the optimization process.</p>
</sec>
<sec id="s3-3">
<title>3.3 Performance evaluation metrics</title>
<p>Mathematical models play an indispensable role in understanding, simulating, and predicting complex environmental phenomena and systems. In various application domains, the evaluation of ML prediction results is an essential component (<xref ref-type="bibr" rid="B13">Feng et al., 2022</xref>; <xref ref-type="bibr" rid="B57">Zhou X. et al., 2023</xref>; <xref ref-type="bibr" rid="B28">Liu et al., 2024</xref>). To accurately assess the predictive performance of ML models, it is advisable to consider commonly used statistical metrics such as coefficient of determination (<inline-formula id="inf17">
<mml:math id="m24">
<mml:mrow>
<mml:msup>
<mml:mi>R</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>), mean absolute error (MAE), mean absolute percentage error (MAPE), and root mean squared error (RMSE) (<xref ref-type="bibr" rid="B26">Li et al., 2023</xref>; <xref ref-type="bibr" rid="B5">An et al., 2024a</xref>). The calculations for these metrics are as <xref ref-type="disp-formula" rid="e8">Equations 8</xref>&#x2013;<xref ref-type="disp-formula" rid="e11">11</xref>.<disp-formula id="e8">
<mml:math id="m25">
<mml:mrow>
<mml:msup>
<mml:mi>R</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(8)</label>
</disp-formula>
<disp-formula id="e9">
<mml:math id="m26">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:mrow>
<mml:mfenced open="|" close="|" separators="|">
<mml:mrow>
<mml:msub>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(9)</label>
</disp-formula>
<disp-formula id="e10">
<mml:math id="m27">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>P</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:mrow>
<mml:mfenced open="|" close="|" separators="|">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mfrac>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>100</mml:mn>
<mml:mo>%</mml:mo>
</mml:mrow>
</mml:math>
<label>(10)</label>
</disp-formula>
<disp-formula id="e11">
<mml:math id="m28">
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:math>
<label>(11)</label>
</disp-formula>
</p>
</sec>
<sec id="s3-4">
<title>3.4 SHAP</title>
<p>Owing to the black-box nature of ML models, comprehending their output results presents a significant challenge (<xref ref-type="bibr" rid="B42">Ribeiro et al., 2016</xref>). In order to enhance the transparency of ML models, interpretability methods for these models have garnered substantial attention from researchers (<xref ref-type="bibr" rid="B25">Li et al., 2019</xref>; <xref ref-type="bibr" rid="B30">Love et al., 2023</xref>; <xref ref-type="bibr" rid="B29">Longo et al., 2024</xref>). The SHapley Additive exPlanations method is an additive explanation approach that interprets model output by calculating the contribution of each input variable to the prediction result, known as the SHAP value (<xref ref-type="bibr" rid="B32">Lundberg and Lee, 2017</xref>). SHAP method analyzes the impact of each feature to explain the model&#x2019;s prediction and sums the SHAP values of all features to obtain the final prediction result (<xref ref-type="bibr" rid="B31">Lundberg et al., 2019</xref>; <xref ref-type="bibr" rid="B40">Qu and Zhang, 2025</xref>). The calculation of SHAP values is given by <xref ref-type="disp-formula" rid="e12">Equation 12</xref>.<disp-formula id="e12">
<mml:math id="m29">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mtext>base</mml:mtext>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:mo>&#x22ef;</mml:mo>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(12)</label>
</disp-formula>where <inline-formula id="inf18">
<mml:math id="m30">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> represents the contribution of the <italic>k</italic>-th feature <inline-formula id="inf19">
<mml:math id="m31">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> in the <italic>i</italic>-th sample to the model prediction <inline-formula id="inf20">
<mml:math id="m32">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>; <inline-formula id="inf21">
<mml:math id="m33">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mtext>base</mml:mtext>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the baseline value. When <inline-formula id="inf22">
<mml:math id="m34">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3e;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, the feature has a positive impact on the model prediction; conversely, when <inline-formula id="inf23">
<mml:math id="m35">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3c;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, the feature has a negative impact.</p>
<p>For a prediction problem involving three parameter variables, the SHAP method is illustrated in <xref ref-type="fig" rid="F5">Figure 5</xref>. Here, <inline-formula id="inf24">
<mml:math id="m36">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> indicates the change in the current prediction value caused by input variable 1, which is a positive impact leading to an increase in the prediction value. Similarly, the addition of input variable two increases the current prediction value, while the addition of input variable 3 decreases the current prediction value by <inline-formula id="inf25">
<mml:math id="m37">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>. SHAP method can effectively explains the model&#x2019;s prediction results, enhancing the understanding of how the model operates (<xref ref-type="bibr" rid="B17">Fu et al., 2022</xref>; <xref ref-type="bibr" rid="B46">Wang et al., 2023</xref>).</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Schematic diagram of the SHAP method.</p>
</caption>
<graphic xlink:href="feart-13-1608468-g005.tif">
<alt-text content-type="machine-generated">Flowchart demonstrating the calculation of predicted value \( y_i \) from a baseline value \( y_{\text{base}} \) using positive and negative contributions from Parameters 1 and 2. Positive contributions are shown with red arrows moving right, and negative contributions are indicated with blue arrows moving left. Each parameter has a specified function contribution \( f(x_{i1}) \) and \( f(x_{i2}) \).</alt-text>
</graphic>
</fig>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>The BO process of the 6 ML models.</p>
</caption>
<graphic xlink:href="feart-13-1608468-g006.tif">
<alt-text content-type="machine-generated">Line chart showing NMSE in millimeters versus iterations for six models: SVR, DT, RF, XGBoost, LightGBM, and KNN. Lines represent each model's performance over 100 iterations, with NMSE values from -0.005 to -0.030.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec id="s4">
<title>4 Result analysis</title>
<sec id="s4-1">
<title>4.1 Model development and hyperparameter optimization</title>
<p>The TBM tunnel crown convergence dataset was standardized and randomly divided into training and test sets in an 8:2 ratio for training and testing of the 6 ML models. After data standardization and train-test splitting, the training set and test set are divided into input data and output data, respectively. The input data and output data are input into the ML models using a function &#x2018;.fit ()&#x2019;, which is used to train the models. Similarly, the input data of the test set are input into the well-trained models to yield the output using the function &#x2018;.predict ()&#x2019;. The model development is conducted using the scikit-learn, xgboost and lightgbm packages with Python.</p>
<p>In this study, to achieve precise prediction of CC in TBM tunnels, six classical ML models&#x2014;SVR, DT, RF, LightGBM, XGBoost, and KNN&#x2014;were meticulously constructed and optimized using BO. The hyperparameters of each model were finely tuned via BO to enhance their predictive capabilities for CC. Negative Mean Squared Error (NMSE) was selected as the objective function for BO to minimize prediction error. To prevent overfitting, five-fold cross-validation was employed during model training. Each model underwent 100 optimization iterations, as shown in <xref ref-type="fig" rid="F6">Figure 6</xref>. The results showed that the NMSE of all six models gradually increased during the BO process and eventually converged, demonstrating the effectiveness of BO in improving the models&#x2019; performance on the training set.</p>
<p>The optimal hyperparameters and optimization results for the 6 ML models are presented in <xref ref-type="sec" rid="s13">Supplementary Tables A1-A6</xref> in the supplementary materials. Using the optimal hyperparameters from <xref ref-type="sec" rid="s13">Supplementary Tables A1-A6</xref>, the best-performing SVR, DT, RF, LightGBM, XGBoost, and KNN models were constructed for CC prediction of TBM tunnel. The prediction performance of the six models on the training set is shown in <xref ref-type="table" rid="T2">Table 2</xref>. From <xref ref-type="table" rid="T2">Table 2</xref>, it can be seen that the XGBoost model achieved the best prediction performance on the training set, with RMSE, MAE, MAPE, and <italic>R</italic>
<sup>2</sup> values of 0.7506, 0.5158, 0.0537, and 0.9744, respectively. The LightGBM model ranked second in prediction performance on the training set, with RMSE, MAE, MAPE, and <italic>R</italic>
<sup>2</sup> values of 0.8170, 0.4773, 0.0537, and 0.9673, respectively.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>The performance metrics of tunnel convergence prediction models on training set.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Model</th>
<th align="center">RMSE (mm)</th>
<th align="center">MAE (mm)</th>
<th align="center">MAPE</th>
<th align="center">
<italic>R</italic>
<sup>2</sup>
</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">SVR</td>
<td align="center">1.5246</td>
<td align="center">1.2680</td>
<td align="center">0.1509</td>
<td align="center">0.8900</td>
</tr>
<tr>
<td align="center">DT</td>
<td align="center">1.0221</td>
<td align="center">0.6319</td>
<td align="center">0.0661</td>
<td align="center">0.9505</td>
</tr>
<tr>
<td align="center">RF</td>
<td align="center">0.8769</td>
<td align="center">0.5296</td>
<td align="center">0.0540</td>
<td align="center">0.9636</td>
</tr>
<tr>
<td align="center">LightGBM</td>
<td align="center">0.8170</td>
<td align="center">0.4773</td>
<td align="center">0.0506</td>
<td align="center">0.9673</td>
</tr>
<tr>
<td align="center">XGBoost</td>
<td align="center">0.7506</td>
<td align="center">0.5158</td>
<td align="center">0.0537</td>
<td align="center">0.9744</td>
</tr>
<tr>
<td align="center">KNN</td>
<td align="center">1.3118</td>
<td align="center">0.8825</td>
<td align="center">0.0995</td>
<td align="center">0.9185</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>To further underscore the superiority of the BO, Grey Wolf Optimization (GWO) (<xref ref-type="bibr" rid="B37">Mirjalili et al., 2014</xref>), Beluga Whale Optimization (BWO) (<xref ref-type="bibr" rid="B54">Zhong et al., 2022</xref>), and Genetic Algorithm (GA) (<xref ref-type="bibr" rid="B4">Albus et al., 2024</xref>) are used to optimize the hyperparameters of the LightGBM model to provide comparison. The optimization results are illustrated in <xref ref-type="fig" rid="F7">Figure 7</xref> and in <xref ref-type="table" rid="T3">Table 3</xref>. It can be observed from <xref ref-type="table" rid="T3">Table 3</xref> that the optimal NMSEs of the are &#x2212;0.0028 mm, which is smaller than the NMSE of BO. Moreover, the GWO, BWO, and GA take much more time than that of BO. The optimization comparison of LightGBM indicates the superior tuning efficiency of BO and better tuning performance.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Optimization curves of LightGBM model using GWO, BWO, and GA: <bold>(a)</bold> GWO; <bold>(b)</bold> BWO; <bold>(c)</bold> GA.</p>
</caption>
<graphic xlink:href="feart-13-1608468-g007.tif">
<alt-text content-type="machine-generated">Three line graphs labeled (a), (b), and (c), showing NMSE in millimeters against iteration for population sizes of 20, 50, 100, and 150. Each graph compares the NMSE values across 100 iterations, with separate lines for each population size. The NMSE stabilizes after initial iterations in each graph, with slight variations for different populations.</alt-text>
</graphic>
</fig>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Comparison of hyperparameter tuning for LightGBM model using GWO, BWO, and GA.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Optimization method</th>
<th align="center">Hyperparameter</th>
<th align="center">Search space</th>
<th align="center">Population</th>
<th align="center">NMSE (mm)</th>
<th align="center">Time consumption (s)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="4" align="center">GWO</td>
<td rowspan="12" align="center">n_estimators<break/>max_depth<break/>learning_rate<break/>num_leaves</td>
<td rowspan="12" align="center">[10, 100]<break/>[3, 50]<break/>[1e-3, 1e-1]<break/>[5, 50]</td>
<td align="center">20</td>
<td align="center">&#x2212;0.0028</td>
<td align="center">311</td>
</tr>
<tr>
<td align="center">50</td>
<td align="center">&#x2212;0.0028</td>
<td align="center">578</td>
</tr>
<tr>
<td align="center">100</td>
<td align="center">&#x2212;0.0028</td>
<td align="center">1,246</td>
</tr>
<tr>
<td align="center">150</td>
<td align="center">&#x2212;0.0028</td>
<td align="center">1,977</td>
</tr>
<tr>
<td rowspan="4" align="center">BWO</td>
<td align="center">20</td>
<td align="center">&#x2212;0.0028</td>
<td align="center">94</td>
</tr>
<tr>
<td align="center">50</td>
<td align="center">&#x2212;0.0028</td>
<td align="center">233</td>
</tr>
<tr>
<td align="center">100</td>
<td align="center">&#x2212;0.0028</td>
<td align="center">390</td>
</tr>
<tr>
<td align="center">150</td>
<td align="center">&#x2212;0.0028</td>
<td align="center">592</td>
</tr>
<tr>
<td rowspan="4" align="center">GA</td>
<td align="center">20</td>
<td align="center">&#x2212;0.0028</td>
<td align="center">301</td>
</tr>
<tr>
<td align="center">50</td>
<td align="center">&#x2212;0.0028</td>
<td align="center">665</td>
</tr>
<tr>
<td align="center">100</td>
<td align="center">&#x2212;0.0028</td>
<td align="center">1,270</td>
</tr>
<tr>
<td align="center">150</td>
<td align="center">&#x2212;0.0028</td>
<td align="center">8,299</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s4-2">
<title>4.2 Prediction results analysis</title>
<p>The prediction performance of the 6 ML models on the test set is shown in <xref ref-type="table" rid="T4">Table 4</xref>. From <xref ref-type="table" rid="T4">Table 4</xref>, it can be observed that the LightGBM model outperformed the other models in terms of prediction accuracy on the test set. The LightGBM model achieved the lowest RMSE (0.9211 mm), MAE (0.6027 mm), and MAPE (0.0644), as well as the highest <italic>R</italic>
<sup>2</sup> (0.9636). This indicates that among the 6 ML models evaluated, LightGBM is the best-performing model for predicting TBM tunnel crown convergence. The XGBoost model, which performed best on the training set (as shown in <xref ref-type="table" rid="T2">Table 2</xref>), also demonstrated satisfactory performance on the test set, with RMSE, MAE, MAPE, and <italic>R</italic>
<sup>2</sup> values of 1.2195 mm, 0.7760 mm, 0.0802, and 0.9227, respectively. Although XGBoost&#x2019;s performance on the test set was slightly inferior to LightGBM, it still ranked second, highlighting its good generalization ability on unseen data. The RF model also showed competitive performance, with RMSE, MAE, MAPE, and <italic>R</italic>
<sup>2</sup> values of 1.2979 mm, 0.8028 mm, 0.0839, and 0.9211, respectively. The RF model&#x2019;s prediction performance on the test set was comparable to that of XGBoost, indicating that ensemble methods are generally suitable for this prediction task.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>The performance metrics of tunnel convergence prediction models on test set.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Model</th>
<th align="center">RMSE (mm)</th>
<th align="center">MAE (mm)</th>
<th align="center">MAPE</th>
<th align="center">R<sup>2</sup>
</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">SVR</td>
<td align="center">1.5971</td>
<td align="center">1.2990</td>
<td align="center">0.1682</td>
<td align="center">0.8805</td>
</tr>
<tr>
<td align="center">DT</td>
<td align="center">1.5250</td>
<td align="center">0.9001</td>
<td align="center">0.0940</td>
<td align="center">0.8910</td>
</tr>
<tr>
<td align="center">RF</td>
<td align="center">1.1279</td>
<td align="center">0.8028</td>
<td align="center">0.0938</td>
<td align="center">0.9211</td>
</tr>
<tr>
<td align="center">LightGBM</td>
<td align="center">0.9122</td>
<td align="center">0.6027</td>
<td align="center">0.0644</td>
<td align="center">0.9636</td>
</tr>
<tr>
<td align="center">XGBoost</td>
<td align="center">1.2192</td>
<td align="center">0.7760</td>
<td align="center">0.0802</td>
<td align="center">0.9227</td>
</tr>
<tr>
<td align="center">KNN</td>
<td align="center">1.6904</td>
<td align="center">1.1675</td>
<td align="center">0.1388</td>
<td align="center">0.8661</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Compared to ensemble methods, the DT model has a simpler structure but still provides reasonable prediction results, with RMSE, MAE, MAPE, and <italic>R</italic>
<sup>2</sup> values of 1.5250 mm, 0.9001 mm, 0.0940, and 0.8910, respectively. However, its performance was significantly lower than that of LightGBM, XGBoost, and RF models, suggesting that more complex models may be needed to capture the nonlinear relationships in the data. The SVR and KNN models had relatively higher prediction errors compared to the other models. The SVR model achieved RMSE, MAE, MAPE, and <italic>R</italic>
<sup>2</sup> values of 1.5971 mm, 1.2990 mm, 0.1682, and 0.8805, respectively, while the KNN model achieved values of 1.6904 mm, 1.1675 mm, 0.1388, and 0.8661, respectively. These results indicate that SVR and KNN are less effective than ensemble methods for the specific task of predicting TBM tunnel crown convergence, likely due to their limitations in handling complex nonlinear interactions between input features. For instance, the SVR model&#x2019;s training set performance is inferior to that of ensemble learning models like LightGBM, and it shows no significant improvement on the test set. This indicates that the SVR model may struggle to capture the complex nonlinear characteristics in TBM tunnel crown convergence data.</p>
<p>As indicated in <xref ref-type="table" rid="T2">Tables 2</xref>,<xref ref-type="table" rid="T4">4</xref>, the XGBoost, RF, DT, and KNN models exhibit markedly better predictive performance on the training set compared to the test set. This suggests potential overfitting during their training process. Conversely, the LightGBM model demonstrates comparable predictive performance on both the training and test sets, implying its strong generalization ability and lower risk of overfitting. This might be attributed to LightGBM&#x2019;s unique algorithmic optimization strategies, such as gradient boosting and the histogram algorithm, which effectively reduce overfitting.</p>
<p>
<xref ref-type="fig" rid="F8">Figure 8</xref> shows the prediction results of the six models on the test set, which depicts the actual versus predicted crown convergence values for each model, clearly comparing their prediction capabilities. Referring to <xref ref-type="fig" rid="F8">Figure 8</xref>, the LightGBM model&#x2019;s predicted values were closest to the actual values, with the smallest deviations, further confirming its superior performance. In contrast, the SVR and KNN models showed larger deviations from the actual values, especially for larger crown convergence values, indicating their limitations in accurately predicting extreme cases. Overall, the prediction performance of the 6 ML models for TBM tunnel crown convergence can be ranked as follows: LightGBM &#x3e; XGBoost &#x3e; RF &#x3e; DT &#x3e; SVR &#x3e; KNN. This outcome offers a key reference for choosing a TBM tunnel crown convergence prediction model. It indicates that in similar complex engineering tasks, opting for advanced ensemble learning models like LightGBM is likely to yield superior predictive results.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>CC prediction results of the 6 ML models on test set: <bold>(a)</bold> SVR; <bold>(b)</bold> DT; <bold>(c)</bold> RF; <bold>(d)</bold> LightGBM; <bold>(e)</bold> XGBoost; <bold>(f)</bold> KNN.</p>
</caption>
<graphic xlink:href="feart-13-1608468-g008.tif">
<alt-text content-type="machine-generated">Scatter plots comparing ground truth versus predicted values for six models: (a) SVR with RMSE 1.5971, MAE 1.2990, MAPE 16.82%, R&#xB2; 0.8805; (b) DT with RMSE 1.5250, MAE 0.9001, MAPE 9.40%, R&#xB2; 0.8910; (c) RF with RMSE 1.2979, MAE 0.8028, MAPE 8.39%, R&#xB2; 0.9211; (d) LGBM with RMSE 0.9122, MAE 0.6027, MAPE 6.44%, R&#xB2; 0.9636; (e) XGBoost with RMSE 1.2195, MAE 0.7760, MAPE 8.02%, R&#xB2; 0.9227; (f) KNN with RMSE 1.6904, MAE 1.1675, MAPE 13.88%, R&#xB2; 0.8661. Each plot includes a line indicating the ideal fit and distribution histograms.</alt-text>
</graphic>
</fig>
<p>
<xref ref-type="table" rid="T5">Table 5</xref> shows the improvement in prediction performance of the LightGBM model compared to the other five models. From <xref ref-type="table" rid="T5">Table 5</xref>, it can be observed that the LightGBM model significantly outperformed the other 5 ML models in terms of prediction accuracy on the test set. Specifically, the LightGBM model achieved average improvements of 36.80%, 36.46%, 37.92%, and 7.58% in RMSE, MAE, MAPE, and <italic>R</italic>
<sup>2</sup>, respectively, compared to the XGBoost, RF, DT, SVR, and KNN models.</p>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Improvements of LightGBM compared to the other 5 ML models.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Model</th>
<th align="center">RMSE improvement</th>
<th align="center">MAE improvement</th>
<th align="center">MAPE improvement</th>
<th align="center">R<sup>2</sup> improvement</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">SVR</td>
<td align="center">42.88%</td>
<td align="center">53.60%</td>
<td align="center">61.70%</td>
<td align="center">9.44%</td>
</tr>
<tr>
<td align="center">DT</td>
<td align="center">40.18%</td>
<td align="center">33.04%</td>
<td align="center">31.48%</td>
<td align="center">8.15%</td>
</tr>
<tr>
<td align="center">RF</td>
<td align="center">29.27%</td>
<td align="center">24.92%</td>
<td align="center">23.21%</td>
<td align="center">4.62%</td>
</tr>
<tr>
<td align="center">XGBoost</td>
<td align="center">25.20%</td>
<td align="center">22.33%</td>
<td align="center">19.62%</td>
<td align="center">4.44%</td>
</tr>
<tr>
<td align="center">KNN</td>
<td align="center">46.04%</td>
<td align="center">48.38%</td>
<td align="center">53.60%</td>
<td align="center">11.26%</td>
</tr>
<tr>
<td align="center">Average</td>
<td align="center">36.80%</td>
<td align="center">36.46%</td>
<td align="center">37.92%</td>
<td align="center">7.58%</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The results of this study have important implications for engineering practice, particularly in the context of TBM tunnel construction. Accurate prediction of crown convergence is crucial for ensuring the safety and stability of tunnels during and after construction. The LightGBM model, with its high prediction accuracy, can serve as a powerful tool for engineers to predict and mitigate potential risks associated with tunnel deformation. By integrating this model into real-time monitoring systems, engineers can make more informed decisions regarding support measures and construction schedules, leading to safer and more efficient tunnel construction processes.</p>
</sec>
<sec id="s4-3">
<title>4.3 Model explanation using SHAP</title>
<p>Although the developed ML models demonstrated satisfactory prediction performance in the task of predicting TBM tunnel crown convergence, particularly the LightGBM model, which achieved a low MAPE of 6.44% on the test set, the &#x201c;black-box&#x201d; nature of ML models makes their internal decision-making mechanisms difficult to understand (<xref ref-type="bibr" rid="B1">Adadi and Berrada, 2018</xref>). To explore the importance of input features and improve the interpretability of the ML models, the SHAP method was used to analyze the LightGBM model in depth, with the results shown in <xref ref-type="fig" rid="F9">Figure 9</xref>. According to <xref ref-type="fig" rid="F9">Figure 9</xref>, the average SHAP values of the six input variables were ranked as follows: T (0.1366) &#x3e; RG (0.0871) &#x3e; DR (0.0528) &#x3e; SA (0.0200) &#x3e; SCS (0.0093) &#x3e; RQD (0.0047). This ranking of average SHAP values reveals the importance of each input feature to the LightGBM model&#x2019;s predictions.</p>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Model explanation results of LightGBM on the impact of the inputs using SHAP.</p>
</caption>
<graphic xlink:href="feart-13-1608468-g009.tif">
<alt-text content-type="machine-generated">Bee swarm plot showing Shapley values for different features with a color gradient representing feature values from low (blue) to high (pink). Features include T, RG, DR, SA, SCS, and RQD. Higher average Shapley values indicate greater feature importance. T has the highest importance, while RQD has the lowest.</alt-text>
</graphic>
</fig>
<p>The time factor (T) had the highest average SHAP value (0.1366), indicating that it has the most significant impact on CC prediction. This result aligns with engineering practice, as tunnel deformation typically accumulates over time, especially after the completion of initial support, where the creep effect of surrounding rock significantly affects tunnel stability. Therefore, the time factor is a key variable in predicting CC. The RG had an average SHAP value of 0.0871, suggesting that it also has a significant impact on CC prediction. Rock grade reflects the strength and stability of the surrounding rock; higher grades indicate better stability and smaller tunnel deformation. The DR had an average SHAP value of 0.0528, demonstrating that it also has some influence on crown settlement prediction. However, compared to the T and RG, the influence of the depth ratio is relatively small. The SA had an average SHAP value of 0.0200, indicating that the stiffness of the initial support also contributes to crown settlement prediction. The steel arch height reflects the stiffness of the initial support; higher stiffness leads to better support effects and smaller tunnel deformation. However, compared to the T and RG, the influence of initial support is relatively small. The SCS and RQD had average SHAP values of 0.0093 and 0.0047, respectively, suggesting that they have a relatively small impact on CC prediction. This may be because these features are correlated with other features (e.g., RG), resulting in their independent contributions being relatively small.</p>
<p>
<xref ref-type="fig" rid="F10">Figure 10</xref> presents the dependence between the four most influential features. The relationship between T and RG indicates that time has less impact on CC at lower RG (better rock quality), but a more pronounced impact at higher RG (poorer rock quality). This aligns with engineering reality, as poor rock quality implies lower stability, leading to more significant deformation over time due to enhanced creep effects. RG and DR are interdependent, with DR exerting a greater influence on CC at higher RG. When rock quality is poor, the tunnel&#x2019;s stability mainly relies on geometric and burial factors, so changes in DR directly affect the stress environment and deformation characteristics, amplifying its impact on CC. DR and SA also show dependence, where steel arch height has a more noticeable effect on CC at larger DR. Deeply buried tunnels face higher geo-stress and deformation risks, and increasing steel arch height can better resist rock pressure and reduce deformation. In contrast, at smaller DR, steel arch height has a relatively minor impact on CC, as shallow tunnels have a milder stress environment, and lower steel arch height may already suffice for support.</p>
<fig id="F10" position="float">
<label>FIGURE 10</label>
<caption>
<p>Dependence plots of the input features: <bold>(a)</bold> T; <bold>(b)</bold> RG; <bold>(c)</bold> DR; <bold>(d)</bold> SA.</p>
</caption>
<graphic xlink:href="feart-13-1608468-g010.tif">
<alt-text content-type="machine-generated">Four scatter plots demonstrate SHAP values for different variables: (a) SHAP values versus T, showing an upward trend; (b) SHAP values versus RG distributed around zero; (c) SHAP values versus DR, indicating varied distribution; (d) SHAP values versus SA, clustered around zero. Axes are labeled, and color bars indicate gradients for additional variables in each plot.</alt-text>
</graphic>
</fig>
<p>Through SHAP analysis, not only can the contribution of each input feature to the model&#x2019;s predictions be quantified, but the interactions between features and their specific impacts on CC can also be understood. This analysis not only improves model interpretability but also provides valuable insights for engineering practice. For example, engineers can focus on the factors that have the greatest impact on crown settlement (e.g., time factor and rock grade) based on the SHAP analysis results, enabling them to take more targeted support measures to ensure tunnel safety and stability.</p>
</sec>
<sec id="s4-4">
<title>4.4 Comparative analysis with related works</title>
<p>Previous studies have constructed reliable ML models for predicting tunnel convergence using different tunnel datasets. <xref ref-type="table" rid="T6">Table 6</xref> summarizes the prediction performance of ML models in tunnel convergence prediction tasks from related studies. According to the statistical results in <xref ref-type="table" rid="T6">Table 6</xref>, the LightGBM model developed in this study achieved an <italic>R</italic>
<sup>2</sup> of 0.9636 on the test set, which is higher than the <italic>R</italic>
<sup>2</sup> values of most ML models in the related studies. This indicates that the LightGBM model developed in this study has satisfactory prediction performance comparable to that of ML models from previous studies, providing an effective tool for the safe and efficient construction of TBM tunnels.</p>
<table-wrap id="T6" position="float">
<label>TABLE 6</label>
<caption>
<p>Summary of tunnel convergence prediction performance of different ML models.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Literature</th>
<th align="center">Model</th>
<th align="center">Input features</th>
<th align="center">Count</th>
<th align="center">R<sup>2</sup>
</th>
<th align="center">MAPE (%)</th>
<th align="center">MAE (mm)</th>
<th align="center">RMSE (mm)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">
<xref ref-type="bibr" rid="B3">Adoko and Wu (2012)</xref>
</td>
<td align="center">ANFIS</td>
<td align="center">GEC, T, SRM, <italic>&#x3b3;</italic>, <italic>H</italic>, <italic>D</italic>
</td>
<td align="center">212</td>
<td align="center">0.95</td>
<td align="center">2.16</td>
<td align="center">-</td>
<td align="center">0.122</td>
</tr>
<tr>
<td align="center">
<xref ref-type="bibr" rid="B33">Mahdevari and Torabi (2012)</xref>
</td>
<td align="center">ANN</td>
<td rowspan="3" align="center">
<italic>E</italic>, <italic>C</italic>, GSI, UCS, <inline-formula id="inf26">
<mml:math id="m38">
<mml:mrow>
<mml:mi>v</mml:mi>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mi>&#x3c6;</mml:mi>
<mml:mo>,</mml:mo>
<mml:mtext>RQD</mml:mtext>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>c</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x3b3;</mml:mi>
<mml:mrow>
<mml:mi>d</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>y</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="normal">H</mml:mi>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x3b3;</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">20</td>
<td align="center">0.9334</td>
<td align="center">-</td>
<td align="center">-</td>
<td align="center">-</td>
</tr>
<tr>
<td rowspan="2" align="center">
<xref ref-type="bibr" rid="B34">Mahdevari et al. (2012)</xref>
</td>
<td align="center">ANN</td>
<td rowspan="2" align="center">18</td>
<td align="center">0.872</td>
<td align="center">-</td>
<td align="center">-</td>
<td align="center">-</td>
</tr>
<tr>
<td align="center">SVM</td>
<td align="center">0.965</td>
<td align="center">-</td>
<td align="center">-</td>
<td align="center">-</td>
</tr>
<tr>
<td rowspan="2" align="center">
<xref ref-type="bibr" rid="B2">Adoko et al. (2013)</xref>
</td>
<td align="center">MARS</td>
<td rowspan="2" align="center">
<italic>&#x3b3;</italic>, SRM, T, <italic>&#x3d5;</italic>, <italic>C</italic>, <italic>X</italic>, <italic>E</italic>, <italic>H</italic>
</td>
<td rowspan="2" align="center">96</td>
<td align="center">0.95</td>
<td align="center">-</td>
<td align="center">0.42</td>
<td align="center">-</td>
</tr>
<tr>
<td align="center">ANN</td>
<td align="center">0.97</td>
<td align="center">-</td>
<td align="center">0.29</td>
<td align="center">-</td>
</tr>
<tr>
<td rowspan="8" align="center">
<xref ref-type="bibr" rid="B45">Torabi-Kaveh and Sarshari (2020)</xref>
</td>
<td align="center">MLP-ANN</td>
<td rowspan="8" align="center">NB, <inline-formula id="inf27">
<mml:math id="m39">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>c</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, RMR, <italic>C</italic>, <italic>H</italic>, <italic>&#x3d5;</italic>
</td>
<td rowspan="8" align="center">30%</td>
<td align="center">0.925</td>
<td align="center">-</td>
<td align="center">0.122</td>
<td align="center">0.169</td>
</tr>
<tr>
<td align="center">RBF-ANN</td>
<td align="center">0.81</td>
<td align="center">-</td>
<td align="center">0.218</td>
<td align="center">0.269</td>
</tr>
<tr>
<td align="center">MLR</td>
<td align="center">0.61</td>
<td align="center">-</td>
<td align="center">0.311</td>
<td align="center">0.386</td>
</tr>
<tr>
<td align="center">MNR</td>
<td align="center">0.648</td>
<td align="center">-</td>
<td align="center">0.299</td>
<td align="center">0.366</td>
</tr>
<tr>
<td align="center">SVR</td>
<td align="center">0.659</td>
<td align="center">-</td>
<td align="center">0.268</td>
<td align="center">0.385</td>
</tr>
<tr>
<td align="center">GPR</td>
<td align="center">0.53</td>
<td align="center">-</td>
<td align="center">0.3479</td>
<td align="center">0.4238</td>
</tr>
<tr>
<td align="center">RT</td>
<td align="center">0.53</td>
<td align="center">-</td>
<td align="center">0.3383</td>
<td align="center">0.4234</td>
</tr>
<tr>
<td align="center">ET</td>
<td align="center">0.63</td>
<td align="center">-</td>
<td align="center">0.3255</td>
<td align="center">0.3743</td>
</tr>
<tr>
<td rowspan="5" align="center">
<xref ref-type="bibr" rid="B36">Mahmoodzadeh et al. (2022)</xref>
</td>
<td align="center">DNN</td>
<td rowspan="5" align="center">GL, CS, C, CA, EM, H, W, E, X, UW, <inline-formula id="inf28">
<mml:math id="m40">
<mml:mrow>
<mml:mi>&#x3c6;</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>v</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td rowspan="5" align="center">110</td>
<td align="center">0.9851</td>
<td align="center">23.63</td>
<td align="center">2.26</td>
<td align="center">4.461</td>
</tr>
<tr>
<td align="center">KNN</td>
<td align="center">0.9507</td>
<td align="center">38.75</td>
<td align="center">5.10</td>
<td align="center">8.549</td>
</tr>
<tr>
<td align="center">GPR</td>
<td align="center">0.9716</td>
<td align="center">31.06</td>
<td align="center">2.88</td>
<td align="center">6.393</td>
</tr>
<tr>
<td align="center">SVR</td>
<td align="center">0.9626</td>
<td align="center">34.03</td>
<td align="center">3.72</td>
<td align="center">6.846</td>
</tr>
<tr>
<td align="center">DT</td>
<td align="center">0.9440</td>
<td align="center">35.83</td>
<td align="center">4.28</td>
<td align="center">8.319</td>
</tr>
<tr>
<td rowspan="6" align="center">
<xref ref-type="bibr" rid="B55">Zhou et al. (2023a)</xref>
</td>
<td align="center">JSO-BPNN</td>
<td rowspan="6" align="center">RMR, <italic>H</italic>, <italic>Q</italic>, <inline-formula id="inf29">
<mml:math id="m41">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c6;</mml:mi>
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td rowspan="6" align="center">28</td>
<td align="center">0.692</td>
<td align="center">-</td>
<td align="center">5.914</td>
<td align="center">9.517</td>
</tr>
<tr>
<td align="center">JSO-GRNN</td>
<td align="center">0.875</td>
<td align="center">-</td>
<td align="center">3.570</td>
<td align="center">5.675</td>
</tr>
<tr>
<td align="center">JSO-ELM</td>
<td align="center">0.697</td>
<td align="center">-</td>
<td align="center">7.440</td>
<td align="center">9.032</td>
</tr>
<tr>
<td align="center">JSO-KELM</td>
<td align="center">0.885</td>
<td align="center">-</td>
<td align="center">3.808</td>
<td align="center">5.132</td>
</tr>
<tr>
<td align="center">JSO-LSSVM</td>
<td align="center">0.839</td>
<td align="center">-</td>
<td align="center">4.639</td>
<td align="center">6.119</td>
</tr>
<tr>
<td align="center">JSO-RF</td>
<td align="center">0.939</td>
<td align="center">-</td>
<td align="center">3.141</td>
<td align="center">3.958</td>
</tr>
<tr>
<td rowspan="7" align="center">
<xref ref-type="bibr" rid="B6">An et al. (2024b)</xref>
</td>
<td align="center">KNN</td>
<td rowspan="7" align="center">DR, RG, GT, SR, SA, T</td>
<td rowspan="7" align="center">547</td>
<td align="center">0.9398</td>
<td align="center">23.47</td>
<td align="center">1.8484</td>
<td align="center">2.7320</td>
</tr>
<tr>
<td align="center">SVR</td>
<td align="center">0.8616</td>
<td align="center">47.90</td>
<td align="center">3.3652</td>
<td align="center">4.1420</td>
</tr>
<tr>
<td align="center">DT</td>
<td align="center">0.9620</td>
<td align="center">22.48</td>
<td align="center">1.4780</td>
<td align="center">2.1692</td>
</tr>
<tr>
<td align="center">RF</td>
<td align="center">0.9804</td>
<td align="center">16.75</td>
<td align="center">0.9913</td>
<td align="center">1.5598</td>
</tr>
<tr>
<td align="center">XGBoost</td>
<td align="center">0.9887</td>
<td align="center">12.71</td>
<td align="center">0.7759</td>
<td align="center">1.1845</td>
</tr>
<tr>
<td align="center">CatBoost</td>
<td align="center">0.9870</td>
<td align="center">13.01</td>
<td align="center">0.7984</td>
<td align="center">1.2693</td>
</tr>
<tr>
<td align="center">Auto-ML</td>
<td align="center">0.9874</td>
<td align="center">13.38</td>
<td align="center">0.8225</td>
<td align="center">1.2480</td>
</tr>
<tr>
<td rowspan="6" align="center">This study</td>
<td align="center">SVR</td>
<td rowspan="6" align="center">DR, RG, GT, SR, SA, T</td>
<td rowspan="6" align="center">300</td>
<td align="center">0.8805</td>
<td align="center">16.82</td>
<td align="center">1.2990</td>
<td align="center">1.5971</td>
</tr>
<tr>
<td align="center">DT</td>
<td align="center">0.8910</td>
<td align="center">9.40</td>
<td align="center">0.9001</td>
<td align="center">1.5250</td>
</tr>
<tr>
<td align="center">RF</td>
<td align="center">0.9122</td>
<td align="center">8.39</td>
<td align="center">0.8028</td>
<td align="center">1.2979</td>
</tr>
<tr>
<td align="center">LightGBM</td>
<td align="center">0.9636</td>
<td align="center">6.44</td>
<td align="center">0.6027</td>
<td align="center">0.9122</td>
</tr>
<tr>
<td align="center">XGBoost</td>
<td align="center">0.9227</td>
<td align="center">8.05</td>
<td align="center">0.7760</td>
<td align="center">1.2195</td>
</tr>
<tr>
<td align="center">KNN</td>
<td align="center">0.8661</td>
<td align="center">13.88</td>
<td align="center">1.1675</td>
<td align="center">1.6904</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Note: SRM, surrounding rock mass rating index; GEC, ground engineering conditions rating index; &#x3b3;, Rock density; <italic>X</italic>, distance between monitoring station and working face; <italic>&#x3d5;</italic>, Friction angle; <italic>E</italic>, elasticity modulus; UCS, uniaxial compressive strength; GSI, geological strength index; <inline-formula id="inf30">
<mml:math id="m42">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, Uniaxial tensile strength; <inline-formula id="inf31">
<mml:math id="m43">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b3;</mml:mi>
<mml:mrow>
<mml:mi>d</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>y</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, Dry unit weight; <inline-formula id="inf32">
<mml:math id="m44">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b3;</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, Saturation unit weight; <inline-formula id="inf33">
<mml:math id="m45">
<mml:mrow>
<mml:mi>v</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, Poisson&#x2019;s ratio; <inline-formula id="inf34">
<mml:math id="m46">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>c</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, Unconfined compressive strength; GL, groundwater level; CA, Cross-section area; EM, excavation method; RMR, rock mass rating; <italic>W</italic>, tunnel width; UW, unit weight; NB, number of installed rock bolts; <italic>Q</italic>, rock mass quality index; <inline-formula id="inf35">
<mml:math id="m47">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c6;</mml:mi>
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, Internal friction angle of rock mass; <inline-formula id="inf36">
<mml:math id="m48">
<mml:mrow>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, Deformation modulus of rock mass; <inline-formula id="inf37">
<mml:math id="m49">
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, Rock mass cohesion.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s4-5">
<title>4.5 Limitations</title>
<p>Despite the accurate prediction of crown convergence in the TBM water conveyance tunnel, this study has some limitations that need to be addressed. Firstly, the generalization of the dataset needs improvement as some features have overly limited values, such as SCS having only 4 values and SA having only 3 values. Secondly, the support form only considered the steel arch height as an input feature, neglecting the stiffness provided by other support measures such as rock bolts, steel mesh, and concrete. Thirdly, the dataset in this study was constructed from a single tunnel, lacking regional and engineering diversity.</p>
</sec>
</sec>
<sec id="s5">
<title>5 Engineering application</title>
<sec id="s5-1">
<title>5.1 Engineering background</title>
<p>The TBM water conveyance tunnel in Xinjiang, China, traverses strata primarily composed of tuffaceous sandstone, tuff, calcareous sandstone, tuff breccia, breccia lava, andesite porphyry, basalt porphyry, dacite porphyry, feldspar sandstone, crystal tuff sandstone, and carbonaceous sandstone from the Devonian and Carboniferous systems; siliceous slate and schistose tuff from the Silurian system; and conglomerate, sandstone, argillaceous sandstone, and carbonaceous mudstone from the Permian and Triassic systems. The tunnel also passes through Hercynian intrusions such as biotite granite, granodiorite, migmatitic granite, and potassic granite. Most of the tunnel sections are located in fresh rock masses with poorly developed fractures, and the surrounding rock is generally blocky and thick-layered, with relatively intact rock masses. The groundwater along the tunnel is mainly bedrock fissure water, with low flow rates. The tunnel crosses five major fault zones, with fracture zones generally ranging from 90 to 100 m wide and a maximum fracture zone width of 800 m.</p>
<p>The total length of the tunnel is 283.41 km, with a burial depth ranging from 150 to 774 m and an average burial depth of 428 m. The maximum burial depth is 774 m. The designed flow rate is 40.0 m<sup>3</sup>/s. The elevation of the tunnel inlet is 638.23 m, and the elevation of the outlet is 528.494 m. The TBM excavation length is 227.08 km, and the drill-and-blast method is used for 56.33 km. The drill-and-blast method uses a horseshoe-shaped cross-section with an excavation diameter ranging from 6.56 to 8.96 m, while the TBM uses a circular cross-section with an excavation diameter of 7.00 m. Secondary lining is mainly applied in sections with poor rock integrity (Class III) and in Class IV and V rock sections, using C35 reinforced concrete lining. In sections with better rock integrity (Class II and III), shotcrete and rock bolting are used as the primary support.</p>
</sec>
<sec id="s5-2">
<title>5.2 Crown convergence prediction results</title>
<p>Six typical sections (K63 &#x2b; 510, K63 &#x2b; 530, K63 &#x2b; 550, K63 &#x2b; 630, K63 &#x2b; 650, and K63 &#x2b; 670) were selected from a TBM water conveyance tunnel in Xinjiang, China and used to validate the LightGBM model&#x2019;s prediction performance. The geological and design information of the tunnel sections are displayed in <xref ref-type="table" rid="T7">Table 7</xref>. To enhance the understanding of engineers in relevant fields, the implementing steps of the application in real-world TBM tunnels are illustrated in <xref ref-type="fig" rid="F11">Figure 11</xref>. To make it more convenient for the workers on site to use, a graphical user interface is designed to implement these models, as shown in <xref ref-type="fig" rid="F12">Figure 12</xref>. In this user interface, the users can choose different well-trained models to predict the CC of the tunnel sections with the input features of the sections. The prediction results can be shown as a curve plot to enhance user&#x2019;s understanding.</p>
<table-wrap id="T7" position="float">
<label>TABLE 7</label>
<caption>
<p>Description of the four tunnel sections.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Tunnel section</th>
<th align="center">Tunnel depth (m)</th>
<th align="center">Rock grade</th>
<th align="center">SCS (MPa)</th>
<th align="center">RQD (%)</th>
<th align="center">Steel arch height (mm)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">K63 &#x2b; 510</td>
<td align="center">527</td>
<td align="center">IV</td>
<td align="center">55</td>
<td align="center">48</td>
<td align="center">150</td>
</tr>
<tr>
<td align="center">K63 &#x2b; 530</td>
<td align="center">525</td>
<td align="center">V</td>
<td align="center">55</td>
<td align="center">48</td>
<td align="center">150</td>
</tr>
<tr>
<td align="center">K63 &#x2b; 550</td>
<td align="center">526</td>
<td align="center">V</td>
<td align="center">49</td>
<td align="center">48</td>
<td align="center">150</td>
</tr>
<tr>
<td align="center">K63 &#x2b; 630</td>
<td align="center">522</td>
<td align="center">V</td>
<td align="center">55</td>
<td align="center">48</td>
<td align="center">150</td>
</tr>
<tr>
<td align="center">K63 &#x2b; 650</td>
<td align="center">520</td>
<td align="center">IV</td>
<td align="center">69</td>
<td align="center">73.2</td>
<td align="center">150</td>
</tr>
<tr>
<td align="center">K63 &#x2b; 710</td>
<td align="center">509</td>
<td align="center">IV</td>
<td align="center">55</td>
<td align="center">73.2</td>
<td align="center">150</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F11" position="float">
<label>FIGURE 11</label>
<caption>
<p>Workflow of crown convergence prediction for real-world TBM tunnels.</p>
</caption>
<graphic xlink:href="feart-13-1608468-g011.tif">
<alt-text content-type="machine-generated">Flowchart detailing the prediction process for tunnel crown convergence. It includes five steps: Step 1: Engineering geological analysis of the tunnel section. Step 2: Value determination of input features. Step 3: Data standardization. Step 4: Crown convergence prediction using a well-trained LightGBM model. Step 5: Crown convergence curve plotting.</alt-text>
</graphic>
</fig>
<fig id="F12" position="float">
<label>FIGURE 12</label>
<caption>
<p>User interface to implement the machine learning models.</p>
</caption>
<graphic xlink:href="feart-13-1608468-g012.tif">
<alt-text content-type="machine-generated">Graph from the Tunnel Convergence Prediction System showing convergence values over 17.5 days. The curve, labeled &#x22;Predicted CC,&#x22; demonstrates increasing convergence from 2 millimeters to approximately 16 millimeters, stabilizing around day 12. The interface includes model configuration and buttons for loading data, predicting, and exporting results.</alt-text>
</graphic>
</fig>
<p>
<xref ref-type="table" rid="T8">Table 8</xref> shows the prediction performance metrics of the LightGBM model for these six sections. According to <xref ref-type="table" rid="T8">Table 8</xref>, the LightGBM model achieved high prediction accuracy in the K63 &#x2b; 510, K63 &#x2b; 530, K63 &#x2b; 650 and K63 &#x2b; 670 sections, with <italic>R</italic>
<sup>2</sup> values of 0.9951, 0.9941, 0.9822 and 0.9882, respectively. In the K63 &#x2b; 550 and K63 &#x2b; 630 sections, the prediction accuracy was slightly lower, with <italic>R</italic>
<sup>2</sup> values of 0.8093 and 0.9275, respectively.</p>
<table-wrap id="T8" position="float">
<label>TABLE 8</label>
<caption>
<p>The performance metrics of tunnel convergence prediction for the six tunnel sections using LightGBM.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Section</th>
<th align="center">RMSE (mm)</th>
<th align="center">MAE (mm)</th>
<th align="center">MAPE (%)</th>
<th align="center">R<sup>2</sup>
</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">K63 &#x2b; 510</td>
<td align="center">0.2825</td>
<td align="center">0.2259</td>
<td align="center">2.18</td>
<td align="center">0.9951</td>
</tr>
<tr>
<td align="center">K63 &#x2b; 530</td>
<td align="center">0.4547</td>
<td align="center">0.4014</td>
<td align="center">4.50</td>
<td align="center">0.9941</td>
</tr>
<tr>
<td align="center">K63 &#x2b; 550</td>
<td align="center">2.2889</td>
<td align="center">1.8748</td>
<td align="center">12.44</td>
<td align="center">0.8093</td>
</tr>
<tr>
<td align="center">K63 &#x2b; 630</td>
<td align="center">1.3249</td>
<td align="center">1.0993</td>
<td align="center">7.50</td>
<td align="center">0.9275</td>
</tr>
<tr>
<td align="center">K63 &#x2b; 650</td>
<td align="center">0.6763</td>
<td align="center">0.5145</td>
<td align="center">6.22</td>
<td align="center">0.9822</td>
</tr>
<tr>
<td align="center">K63 &#x2b; 710</td>
<td align="center">0.4308</td>
<td align="center">0.2922</td>
<td align="center">2.87</td>
<td align="center">0.9882</td>
</tr>
<tr>
<td align="center">Average</td>
<td align="center">0.9097</td>
<td align="center">0.7347</td>
<td align="center">5.95</td>
<td align="center">0.9494</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Overall, the LightGBM model achieved an average RMSE of 0.9097 mm, an average MAE of 0.7347 mm, an average MAPE of 5.95%, and an average <italic>R</italic>
<sup>2</sup> of 0.9494 across the six sections. This indicates that the LightGBM model has high prediction accuracy and generalization ability in actual TBM tunnel engineering. Additionally, <xref ref-type="fig" rid="F13">Figure 13</xref> shows the prediction curves of the LightGBM model for the six sections compared to the actual observed values. It can be observed that the model&#x2019;s prediction curves closely match the actual observed values in most sections, particularly in the K63 &#x2b; 510, K63 &#x2b; 530, K63 &#x2b; 650, and K63 &#x2b; 710 sections, where the prediction curves almost completely overlap with the actual observed values. In the K63 &#x2b; 550 and K63 &#x2b; 630 sections, although the prediction errors increased slightly, the model still captured the trend of crown convergence well, with small deviations between the prediction curves and the actual observed values.</p>
<fig id="F13" position="float">
<label>FIGURE 13</label>
<caption>
<p>Prediction curves of the six tunnel sections yielded by LightGBM model.</p>
</caption>
<graphic xlink:href="feart-13-1608468-g013.tif">
<alt-text content-type="machine-generated">Six graphs compare measured and predicted cumulative carbon (CC) in millimeters over 30 days at six locations: K63&#x26;&#x23;&#x2b;510, K63&#x26;&#x23;&#x2b;530, K63&#x26;&#x23;&#x2b;550, K63&#x26;&#x23;&#x2b;630, K63&#x26;&#x23;&#x2b;650, and K63&#x26;&#x23;&#x2b;710. Each graph includes statistical metrics: RMSE, MAE, MAPE, and R-squared, showing close alignment between measured and predicted values. The highest MAPE is 12.44% at K63&#x26;&#x23;&#x2b;550, indicating greater variance, while other locations demonstrate stronger correlation.</alt-text>
</graphic>
</fig>
<p>The high prediction accuracy and generalization ability of the LightGBM model in actual TBM tunnel engineering provide strong support for tunnel support design and construction decision-making. By integrating this model into real-time monitoring systems, engineers can predict crown convergence in real-time and adjust support measures and construction schedules accordingly, ensuring the safety and stability of the tunnel. For instance, in the K63 &#x2b; 550 and K63 &#x2b; 630 sections, despite a slight increase in prediction errors, the model still captures the crown convergence trend effectively, offering a reliable basis for risk warning and decision support during construction.</p>
</sec>
</sec>
<sec sec-type="conclusion" id="s6">
<title>6 Conclusion</title>
<p>This study proposes an interpretable ML method based on BO and SHAP for predicting crown convergence in TBM tunnels. Firstly, a large-scale dataset containing 1,501 samples was constructed. Then, six classical ML models (SVM, DT, RF, LightGBM, XGBoost, and KNN) were developed, and BO was applied to tune the hyperparameters of each model to achieve accurate prediction of crown convergence. Subsequently, the SHAP method was used to interpret the LightGBM model, quantifying the contribution of each input feature to the model&#x2019;s predictions and improving model interpretability. Finally, the LightGBM model was validated using data from six sections of a TBM water conveyance tunnel in Xinjiang, China. The results show that:<list list-type="simple">
<list-item>
<p>(1) The LightGBM model achieved the best prediction performance on the test set, with RMSE, MAE, MAPE, and <italic>R</italic>
<sup>2</sup> values of 0.9122 mm, 0.6027 mm, 0.0644, and 0.9636, respectively. The prediction performance of the 6 ML models was ranked as follows: LightGBM &#x3e; XGBoost &#x3e; RF &#x3e; DT &#x3e; SVR &#x3e; KNN.</p>
</list-item>
<list-item>
<p>(2) SHAP analysis revealed the contribution of input features to the LightGBM model&#x2019;s predictions. The average SHAP values of the six input features were ranked as follows: T (0.1366) &#x3e; RG (0.0871) &#x3e; DR (0.0528) &#x3e; SA (0.0200) &#x3e; SCS (0.0093) &#x3e; RQD (0.0047).</p>
</list-item>
<list-item>
<p>(3) In practical engineering applications, the LightGBM model achieved an average RMSE of 0.9097 mm, an average MAE of 0.7347 mm, an average MAPE of 5.95%, and an average <italic>R</italic>
<sup>2</sup> of 0.9494 across six sections, demonstrating accurate prediction of crown convergence in the TBM water conveyance tunnel.</p>
</list-item>
</list>
</p>
<p>Future research will incorporate the comprehensive stiffness of the support structure as an input feature to improve the model&#x2019;s prediction accuracy. Moreover, data from other tunnels will be collected to increase the diversity of the dataset and improve the generalization ability of the ML models.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s7">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/supplementary material, further inquiries can be directed to the corresponding author.</p>
</sec>
<sec sec-type="author-contributions" id="s8">
<title>Author contributions</title>
<p>WH: Conceptualization, Validation, Investigation, Writing &#x2013; original draft, Methodology, Formal Analysis, Data curation. KW: Writing &#x2013; original draft, Software, Validation, Data curation, Investigation. HL: Data curation, Visualization, Methodology, Writing &#x2013; original draft, Formal Analysis, Investigation. WL: Validation, Data curation, Investigation, Writing &#x2013; original draft, Formal Analysis, Software. XL: Formal Analysis, Writing &#x2013; review and editing, Data curation, Investigation. PG: Funding acquisition, Resources, Writing &#x2013; review and editing, Project administration, Supervision.</p>
</sec>
<sec sec-type="funding-information" id="s9">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research and/or publication of this article. This work was supported by the China Postdoctoral Science Foundation (2024M752746, 2024T170760) and Education Department of Hunan Province of China (24B0915).</p>
</sec>
<sec sec-type="COI-statement" id="s10">
<title>Conflict of interest</title>
<p>Authors WH and HL were employed by CISPDR Corporation. Author KW was employed by Hubei Shenlong Geological Engineering Investigation Institute Co., Ltd. Author XL was employed by Xinjiang Water Conservancy Development and Construction Group Co., Ltd.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
<p>The reviewer YZ declared a shared affiliation with the author PG to the handling editor at time of review.</p>
</sec>
<sec sec-type="ai-statement" id="s11">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="s12">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec sec-type="supplementary-material" id="s13">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/feart.2025.1608468/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/feart.2025.1608468/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table1.docx" id="SM1" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table2.docx" id="SM2" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table5.docx" id="SM3" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table3.docx" id="SM4" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table4.docx" id="SM5" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table6.docx" id="SM6" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet1.xlsx" id="SM7" mimetype="application/xlsx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Adadi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Berrada</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Peeking inside the black-box: a survey on explainable artificial intelligence (xai)</article-title>. <source>IEEE Access</source> <volume>6</volume>, <fpage>52138</fpage>&#x2013;<lpage>52160</lpage>. <pub-id pub-id-type="doi">10.1109/ACCESS.2018.2870052</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Adoko</surname>
<given-names>A.-C.</given-names>
</name>
<name>
<surname>Jiao</surname>
<given-names>Y.-Y.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.-H.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Predicting tunnel convergence using multivariate adaptive regression spline and artificial neural network</article-title>. <source>Tunn. Undergr. Space Technol.</source> <volume>38</volume>, <fpage>368</fpage>&#x2013;<lpage>376</lpage>. <pub-id pub-id-type="doi">10.1016/j.tust.2013.07.023</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Adoko</surname>
<given-names>A. C.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Estimation of convergence of a high-speed railway tunnel in weak rocks using an adaptive neuro-fuzzy inference system (ANFIS) approach</article-title>. <source>J. Rock Mech. Geotech. Eng.</source> <volume>4</volume>, <fpage>11</fpage>&#x2013;<lpage>18</lpage>. <pub-id pub-id-type="doi">10.3724/SP.J.1235.2012.00011</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Albus</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Hornek</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Kraus</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Huber</surname>
<given-names>M. F.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Towards scalability for resource reconfiguration in robotic assembly line balancing problems using a modified genetic algorithm</article-title>. <source>J. Intell. Manuf.</source> <volume>36</volume>, <fpage>1175</fpage>&#x2013;<lpage>1199</lpage>. <pub-id pub-id-type="doi">10.1007/s10845-023-02292-0</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>An</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Jiao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Qi</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2024a</year>). <article-title>Explainable deep learning-based dynamic prediction of surface settlement considering temporal characteristics during deep excavation</article-title>. <source>Appl. Soft Comput.</source> <volume>167</volume>, <fpage>112273</fpage>. <pub-id pub-id-type="doi">10.1016/j.asoc.2024.112273</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>An</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Jiao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2024b</year>). <article-title>Optimized machine learning models for predicting crown convergence of plateau mountain tunnels</article-title>. <source>Transp. Geotech.</source> <volume>46</volume>, <fpage>101254</fpage>. <pub-id pub-id-type="doi">10.1016/j.trgeo.2024.101254</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Arora</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Gutierrez</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Viscous-elastic-plastic response of tunnels in squeezing ground conditions: analytical modeling and experimental validation</article-title>. <source>Int. J. Rock Mech. Min.</source> <volume>146</volume>, <fpage>104888</fpage>. <pub-id pub-id-type="doi">10.1016/j.ijrmms.2021.104888</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Asadollahpour</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Rahmannejad</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Asghari</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Abdollahipour</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Back analysis of closure parameters of Panet equation and Burger&#x2019;s model of Babolak water tunnel conveyance</article-title>. <source>Int. J. Rock Mech. Min. Sci.</source> <volume>68</volume>, <fpage>159</fpage>&#x2013;<lpage>166</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijrmms.2014.02.017</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bo</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>F.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Robust model for tunnel squeezing using Bayesian optimized classifiers with partially missing database</article-title>. <source>Undergr. Space</source> <volume>10</volume>, <fpage>91</fpage>&#x2013;<lpage>117</lpage>. <pub-id pub-id-type="doi">10.1016/j.undsp.2022.11.001</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Seo</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Prediction of rock mass class ahead of TBM excavation face by ML and DL algorithms with Bayesian TPE optimization and SHAP feature analysis</article-title>. <source>Acta Geotech.</source> <volume>18</volume>, <fpage>3825</fpage>&#x2013;<lpage>3848</lpage>. <pub-id pub-id-type="doi">10.1007/s11440-022-01779-z</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>R.-P.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>X.-T.</given-names>
</name>
<name>
<surname>Kang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>Z.-Q.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Deformation and stress characteristics of existing twin tunnels induced by close-distance EPBS under-crossing</article-title>. <source>Tunn. Undergr. Space Technol.</source> <volume>82</volume>, <fpage>468</fpage>&#x2013;<lpage>481</lpage>. <pub-id pub-id-type="doi">10.1016/j.tust.2018.08.059</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Guestrin</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2016</year>). &#x201c;<article-title>XGBoost: a scalable tree boosting system</article-title>,&#x201d; in <source>Proceedings of the 22nd ACM SIGKDD international conference on knowledge discovery and data mining</source> (<publisher-loc>New York, NY, USA</publisher-loc>: <publisher-name>Association for Computing Machinery</publisher-name>), <fpage>785</fpage>&#x2013;<lpage>794</lpage>. <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feng</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>Y.-F.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>An improved artificial bee colony-random forest (IABC-RF) model for predicting the tunnel deformation due to an adjacent foundation pit excavation</article-title>. <source>Undergr. Space</source> <volume>7</volume>, <fpage>514</fpage>&#x2013;<lpage>527</lpage>. <pub-id pub-id-type="doi">10.1016/j.undsp.2021.11.004</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feng</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Jimenez</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Zeng</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Senent</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Prediction of time-dependent tunnel convergences using a Bayesian updating approach</article-title>. <source>Tunn. Undergr. Space Technol.</source> <volume>94</volume>, <fpage>103118</fpage>. <pub-id pub-id-type="doi">10.1016/j.tust.2019.103118</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Frazier</surname>
<given-names>P. I.</given-names>
</name>
</person-group> (<year>2018</year>). <source>A tutorial on bayesian optimization</source>. <pub-id pub-id-type="doi">10.48550/arXiv.1807.02811</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ponnarasu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>A hybrid deep learning approach for dynamic attitude and position prediction in tunnel construction considering spatio-temporal patterns</article-title>. <source>Expert Syst. Appl.</source> <volume>212</volume>, <fpage>118721</fpage>. <pub-id pub-id-type="doi">10.1016/j.eswa.2022.118721</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Tiong</surname>
<given-names>R. L. K.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Data-driven real-time advanced geological prediction in tunnel construction using a hybrid deep learning approach</article-title>. <source>Autom. Constr.</source> <volume>146</volume>, <fpage>104672</fpage>. <pub-id pub-id-type="doi">10.1016/j.autcon.2022.104672</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gao</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>TBM penetration rate prediction based on the long short-term memory neural network</article-title>. <source>Undergr. Space</source> <volume>6</volume>, <fpage>718</fpage>&#x2013;<lpage>731</lpage>. <pub-id pub-id-type="doi">10.1016/j.undsp.2020.01.003</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guan</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Ou</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Pei</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2025</year>). <article-title>Tunnel squeezing prediction based on partially missing dataset and optimized machine learning models</article-title>. <source>Front. Earth Sci.</source> <volume>13</volume>. <pub-id pub-id-type="doi">10.3389/feart.2025.1511413</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Lei</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zeng</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Yao</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Ground settlement and tunnel response due to twin-curved shield tunnelling in soft ground with small clear distance</article-title>. <source>J. Rock Mech. Geotech. Eng.</source> <volume>16</volume>, <fpage>3122</fpage>&#x2013;<lpage>3135</lpage>. <pub-id pub-id-type="doi">10.1016/j.jrmge.2024.06.005</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>H. W.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Influence of spatial variability of soil Young&#x2019;s modulus on tunnel convergence in soft soils</article-title>. <source>Eng. Geol.</source> <volume>228</volume>, <fpage>357</fpage>&#x2013;<lpage>370</lpage>. <pub-id pub-id-type="doi">10.1016/j.enggeo.2017.09.011</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Ke</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Meng</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Finley</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). &#x201c;<article-title>LightGBM: a highly efficient gradient boosting decision tree</article-title>,&#x201d; in <source>Advances in neural information processing systems</source> (<publisher-name>Long Beach, CA, USA: 31st Conference on Neural Information Processing Systems (NIPS 2017)</publisher-name>).</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Pham</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Oh</surname>
<given-names>J.-Y.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>S.-J.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Classification of surface settlement levels induced by TBM driving in urban areas using random forest with data-driven feature selection</article-title>. <source>Autom. Constr.</source> <volume>135</volume>, <fpage>104109</fpage>. <pub-id pub-id-type="doi">10.1016/j.autcon.2021.104109</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Dias</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Intelligent prediction and visual optimization of surface settlement induced by earth pressure balance shield tunneling</article-title>. <source>Tunn. Undergr. Space Technol.</source> <volume>154</volume>, <fpage>106138</fpage>. <pub-id pub-id-type="doi">10.1016/j.tust.2024.106138</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Chou</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2019</year>). &#x201c;<article-title>A modified LIME and its application to explain service supply chain forecasting</article-title>,&#x201d; in <source>Natural Language processing and Chinese computing</source> (<publisher-loc>Cham</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>637</fpage>&#x2013;<lpage>644</lpage>. <pub-id pub-id-type="doi">10.1007/978-3-030-32236-6_58</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Dynamic and explainable deep learning-based risk prediction on adjacent building induced by deep excavation</article-title>. <source>Tunn. Undergr. Space Technol.</source> <volume>140</volume>, <fpage>105243</fpage>. <pub-id pub-id-type="doi">10.1016/j.tust.2023.105243</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Gutierrez</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Effectiveness of predicting tunneling-induced ground settlements using machine learning methods with small datasets</article-title>. <source>J. Rock Mech. Geotech. Eng.</source> <volume>14</volume>, <fpage>1028</fpage>&#x2013;<lpage>1041</lpage>. <pub-id pub-id-type="doi">10.1016/j.jrmge.2021.08.018</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Prediction interaction responses between railway subgrade and shield tunnelling using machine learning with sparrow search algorithm</article-title>. <source>Transp. Geotech.</source> <volume>44</volume>, <fpage>101169</fpage>. <pub-id pub-id-type="doi">10.1016/j.trgeo.2023.101169</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Longo</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Brcic</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Cabitza</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Confalonieri</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Ser</surname>
<given-names>J. D.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Explainable Artificial Intelligence (XAI) 2.0: a manifesto of open challenges and interdisciplinary research directions</article-title>. <source>Inf. Fusion</source> <volume>106</volume>, <fpage>102301</fpage>. <pub-id pub-id-type="doi">10.1016/j.inffus.2024.102301</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Love</surname>
<given-names>P. E. D.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Matthews</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Porter</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Explainable artificial intelligence (XAI): precepts, models, and opportunities for research in construction</article-title>. <source>Adv. Eng. Inf.</source> <volume>57</volume>, <fpage>102024</fpage>. <pub-id pub-id-type="doi">10.1016/j.aei.2023.102024</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Lundberg</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Erion</surname>
<given-names>G. G.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>S.-I.</given-names>
</name>
</person-group> (<year>2019</year>). <source>Consistent individualized feature attribution for tree ensembles</source>. <pub-id pub-id-type="doi">10.48550/arXiv.1802.03888</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Lundberg</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>S.-I.</given-names>
</name>
</person-group> (<year>2017</year>). &#x201c;<article-title>A unified approach to interpreting model predictions</article-title>,&#x201d; in <source>Advances in neural information processing systems 30 (NIPS 2017)</source>. <person-group person-group-type="editor">
<name>
<surname>Guyon</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Luxburg</surname>
<given-names>U. V.</given-names>
</name>
<name>
<surname>Bengio</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wallach</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Fergus</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Vishwanathan</surname>
<given-names>S.</given-names>
</name>
</person-group>, (<publisher-loc>La Jolla</publisher-loc>: <publisher-name>Neural Information Processing Systems</publisher-name>).</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mahdevari</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Torabi</surname>
<given-names>S. R.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Prediction of tunnel convergence using artificial neural networks</article-title>. <source>Tunn. Undergr. Space Technol.</source> <volume>28</volume>, <fpage>218</fpage>&#x2013;<lpage>228</lpage>. <pub-id pub-id-type="doi">10.1016/j.tust.2011.11.002</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mahdevari</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Torabi</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Monjezi</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Application of artificial intelligence algorithms in predicting tunnel convergence to avoid TBM jamming phenomenon</article-title>. <source>Int. J. Rock Mech. Min. Sci.</source> <volume>55</volume>, <fpage>33</fpage>&#x2013;<lpage>44</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijrmms.2012.06.005</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mahmoodzadeh</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mohammadi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Daraei</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ali</surname>
<given-names>H. F. H.</given-names>
</name>
<name>
<surname>Abdullah</surname>
<given-names>A. I.</given-names>
</name>
<name>
<surname>Al-Salihi</surname>
<given-names>N. K.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Forecasting tunnel geology, construction time and costs using machine learning methods</article-title>. <source>Neural comput. Appl.</source> <volume>33</volume>, <fpage>321</fpage>&#x2013;<lpage>348</lpage>. <pub-id pub-id-type="doi">10.1007/s00521-020-05006-2</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mahmoodzadeh</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Nejati</surname>
<given-names>H. R.</given-names>
</name>
<name>
<surname>Mohammadi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ibrahim</surname>
<given-names>H. H.</given-names>
</name>
<name>
<surname>Mohammed</surname>
<given-names>A. H.</given-names>
</name>
<name>
<surname>Rashidi</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Assessment of wall convergence for tunnels using machine learning techniques</article-title>. <source>Geomech. Eng.</source> <volume>31</volume>, <fpage>265</fpage>&#x2013;<lpage>279</lpage>. <pub-id pub-id-type="doi">10.12989/gae.2022.31.3.265</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mirjalili</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mirjalili</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Lewis</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Grey Wolf optimizer</article-title>. <source>Adv. Eng. Softw.</source> <volume>69</volume>, <fpage>46</fpage>&#x2013;<lpage>61</lpage>. <pub-id pub-id-type="doi">10.1016/j.advengsoft.2013.12.007</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Naser</surname>
<given-names>M. Z.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>An engineer&#x2019;s guide to eXplainable Artificial Intelligence and Interpretable Machine Learning: navigating causality, forced goodness, and the false perception of inference</article-title>. <source>Autom. Constr.</source> <volume>129</volume>, <fpage>103821</fpage>. <pub-id pub-id-type="doi">10.1016/j.autcon.2021.103821</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Pu</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Research on deformation prediction of tunnel surrounding rock using the model combining firefly algorithm and nonlinear auto-regressive dynamic neural network</article-title>. <source>Eng. Comput.</source> <volume>37</volume>, <fpage>1443</fpage>&#x2013;<lpage>1453</lpage>. <pub-id pub-id-type="doi">10.1007/s00366-019-00894-y</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qu</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Uncertainty-based multi-objective optimization in twin tunnel design considering fluid-solid coupling</article-title>. <source>Reliab. Eng. Syst. Safe.</source> <volume>253</volume>, <fpage>110575</fpage>. <pub-id pub-id-type="doi">10.1016/j.ress.2024.110575</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ray</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Samui</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Roy</surname>
<given-names>L. B.</given-names>
</name>
<name>
<surname>Goh</surname>
<given-names>A. T. C.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Application of soft computing techniques for shallow foundation reliability in geotechnical engineering</article-title>. <source>Geosci. Front.</source> <volume>12</volume>, <fpage>375</fpage>&#x2013;<lpage>383</lpage>. <pub-id pub-id-type="doi">10.1016/j.gsf.2020.05.003</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Ribeiro</surname>
<given-names>M. T.</given-names>
</name>
<name>
<surname>Singh</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Guestrin</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2016</year>). &#x201c;<article-title>&#x201c;Why should I trust you?&#x201d;: explaining the predictions of any classifier</article-title>,&#x201d; in <source>Proceedings of the 22nd ACM SIGKDD international conference on knowledge discovery and data mining</source> (<publisher-loc>New York, NY, USA</publisher-loc>: <publisher-name>Association for Computing Machinery</publisher-name>), <fpage>1135</fpage>&#x2013;<lpage>1144</lpage>. <pub-id pub-id-type="doi">10.1145/2939672.2939778</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sheini Dashtgoli</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Sadeghian</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Mahboubi Ardakani</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Mohammadnezhad</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Giustiniani</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Busetti</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Predictive modeling of shallow tunnel behavior: leveraging machine learning for maximum convergence displacement estimation</article-title>. <source>Transp. Geotech.</source> <volume>47</volume>, <fpage>101284</fpage>. <pub-id pub-id-type="doi">10.1016/j.trgeo.2024.101284</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>You</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Multi-output prediction for TBM operation parameters based on stacking ensemble algorithm</article-title>. <source>Tunn. Undergr. Space Technol.</source> <volume>152</volume>, <fpage>105960</fpage>. <pub-id pub-id-type="doi">10.1016/j.tust.2024.105960</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Torabi-Kaveh</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sarshari</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Predicting convergence rate of namaklan twin tunnels using machine learning methods</article-title>. <source>Arab. J. Sci. Eng.</source> <volume>45</volume>, <fpage>3761</fpage>&#x2013;<lpage>3780</lpage>. <pub-id pub-id-type="doi">10.1007/s13369-019-04239-1</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Time series prediction of tunnel boring machine (TBM) performance during excavation using causal explainable artificial intelligence (CX-AI)</article-title>. <source>Autom. Constr.</source> <volume>147</volume>, <fpage>104730</fpage>. <pub-id pub-id-type="doi">10.1016/j.autcon.2022.104730</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Iura</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Deformation and mechanical characteristics of tunneling in squeezing ground: a case study of the west section of the Tawarazaka Tunnel in Japan</article-title>. <source>Tunn. Undergr. Space Technol.</source> <volume>109</volume>, <fpage>103697</fpage>. <pub-id pub-id-type="doi">10.1016/j.tust.2020.103697</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Hua</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Deep learning of rock microscopic images for intelligent lithology identification: neural network comparison and selection</article-title>. <source>J. Rock Mech. Geotech. Eng.</source> <volume>14</volume>, <fpage>1140</fpage>&#x2013;<lpage>1152</lpage>. <pub-id pub-id-type="doi">10.1016/j.jrmge.2022.05.009</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yin</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Point and interval estimation of rock mass boreability for tunnel boring machine using an improved attribute-weighted deep belief network</article-title>. <source>Acta Geotech.</source> <volume>18</volume>, <fpage>1769</fpage>&#x2013;<lpage>1791</lpage>. <pub-id pub-id-type="doi">10.1007/s11440-022-01651-0</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Tiong</surname>
<given-names>R. L. K.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Digital twin enabled real-time advanced control of TBM operation using deep learning methods</article-title>. <source>Autom. Constr.</source> <volume>158</volume>, <fpage>105240</fpage>. <pub-id pub-id-type="doi">10.1016/j.autcon.2023.105240</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>TBM performance prediction with Bayesian optimization and automated machine learning</article-title>. <source>Tunn. Undergr. Space Technol.</source> <volume>103</volume>, <fpage>103493</fpage>. <pub-id pub-id-type="doi">10.1016/j.tust.2020.103493</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Goh</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Prediction of lining response for twin tunnels constructed in anisotropic clay using machine learning techniques</article-title>. <source>Undergr. Space</source> <volume>7</volume>, <fpage>122</fpage>&#x2013;<lpage>133</lpage>. <pub-id pub-id-type="doi">10.1016/j.undsp.2020.02.007</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Q.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Data-driven intelligent prediction of TBM surrounding rock and personalized evaluation of disaster-inducing factors</article-title>. <source>Tunn. Undergr. Space Technol.</source> <volume>148</volume>, <fpage>105768</fpage>. <pub-id pub-id-type="doi">10.1016/j.tust.2024.105768</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhong</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Meng</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Beluga whale optimization: a novel nature-inspired metaheuristic algorithm</article-title>. <source>Knowledge-Based Syst.</source> <volume>251</volume>, <fpage>109215</fpage>. <pub-id pub-id-type="doi">10.1016/j.knosys.2022.109215</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Qiu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Tao</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2023a</year>). <article-title>Machine learning models to predict the tunnel wall convergence</article-title>. <source>Transp. Geotech.</source> <volume>41</volume>, <fpage>101022</fpage>. <pub-id pub-id-type="doi">10.1016/j.trgeo.2023.101022</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Qiu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Armaghani</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Yong</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Predicting tunnel squeezing using support vector machine optimized by whale optimization algorithm</article-title>. <source>Acta Geotech.</source> <volume>17</volume>, <fpage>1343</fpage>&#x2013;<lpage>1366</lpage>. <pub-id pub-id-type="doi">10.1007/s11440-022-01450-7</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Bian</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2023b</year>). <article-title>Prediction of maximum ground surface settlement induced by shield tunneling using XGBoost algorithm with golden-sine seagull optimization</article-title>. <source>Comput. Geotech.</source> <volume>154</volume>, <fpage>105156</fpage>. <pub-id pub-id-type="doi">10.1016/j.compgeo.2022.105156</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>