<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Environ. Sci.</journal-id>
<journal-title>Frontiers in Environmental Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Environ. Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-665X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1409072</article-id>
<article-id pub-id-type="doi">10.3389/fenvs.2024.1409072</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Environmental Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Fast dynamic prediction of consequences of heavy gas leakage accidents based on machine learning</article-title>
<alt-title alt-title-type="left-running-head">Fan et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fenvs.2024.1409072">10.3389/fenvs.2024.1409072</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Fan</surname>
<given-names>Chenqing</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2700348/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gong</surname>
<given-names>Haixing</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2771748/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Yan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/185935/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ma</surname>
<given-names>Weichun</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Yu</surname>
<given-names>Qi</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Environmental Science and Engineering</institution>, <institution>Fudan University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Institute of Atmospheric Sciences</institution>, <institution>Department of Atmospheric and Oceanic Sciences</institution>, <institution>Fudan University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/893641/overview">Sushant K. Singh</ext-link>, CAIES Foundation, India</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1226406/overview">Ying Zhu</ext-link>, School of Environmental and Municipal Engineering, Xi&#x2019;an University of Architecture and Technology, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2722256/overview">Nagoor Basha Shaik</ext-link>, Chulalongkorn University, Thailand</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Qi Yu, <email>qiyu@fudan.edu.cn</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>23</day>
<month>07</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>12</volume>
<elocation-id>1409072</elocation-id>
<history>
<date date-type="received">
<day>29</day>
<month>03</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>02</day>
<month>07</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Fan, Gong, Zhang, Ma and Yu.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Fan, Gong, Zhang, Ma and Yu</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>The field of emergency risk management in chemical parks has been characterized by a lack of fast, precise and dynamic prediction methods. The application of computational fluid dynamics (CFD) models, which offer the potential for dynamic and precise prediction, has been hindered by high computational costs. Therefore, taking liquid benzene as a case study, this paper combined machine learning (ML) algorithms with a CFD-based precise prediction model, to develop an ML model for fast dynamic prediction of heavy gas leakage consequences in chemical parks. Employing the CFD data as the input, the prediction models were developed using ML algorithms, refined with Bayesian optimization for parameter tuning. This study utilized PHOENICS software to establish a dynamic prediction model for the diffusion of liquid benzene leakage, validated by Burro nine experiment data. Comparative analyses of models based on five&#xa0;ML algorithms were conducted to evaluate the reliability of their predictions using both CFD standard and noisy data. The results indicated that temperature had the most significant effect on the consequences of the leakage accidents among four key factors (wind speed, temperature, leakage aperture and atmospheric stability), followed by wind speed. These factors served as input variables for ML model training. Among the models evaluated, the eXtreme Gradient Boosting (XGBoost) model showed superior performance, irrespective of the presence of noise in the data. An XGBoost-based fast prediction model was ultimately developed for predicting the consequences of liquid benzene leakage. A case analysis was conducted to validate the feasibility of the model prediction. The relative errors between the predicted and actual values of the model for acute exposure guideline level-1 (AEGL-1), AEGL-2, and AEGL-3 distances were 2.70%, 2.58%, and 0.23%, respectively. Furthermore, the XGBoost model completed the prediction in only 0.218&#xa0;s, a stark contrast to the hours necessitated by the CFD model, thus offering substantial computational time savings while maintaining high accuracy levels. This paper introduces an ML model for fast dynamic prediction of heavy gas leakage, enabling chemical parks to make more timely and accurate decisions in emergency risk management.</p>
</abstract>
<kwd-group>
<kwd>heavy gas leakage</kwd>
<kwd>machine learning</kwd>
<kwd>computational fluid dynamics</kwd>
<kwd>liquid benzene</kwd>
<kwd>analysis of accident consequences</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Big Data, AI, and the Environment</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Recent years have witnessed a marked increase in safety accidents globally, leading to significant loss of life and property damage, and severely impacting the chemical industry (<xref ref-type="bibr" rid="B21">Kang et al., 2017</xref>). These accidents are primarily attributed to shortcomings in risk management techniques, such as insufficient monitoring systems and emergency response capabilities, hindering effective risk detection and management (<xref ref-type="bibr" rid="B30">Liu and Li, 2013</xref>). In response, government regulations are escalating their safety management requirements for enterprises, with a particular focus on enhancing emergency response technologies in the chemical industry. Consequently, the advancement and integration of information technology, the Internet of Things, big data, and artificial intelligence (AI) are facilitating the development of smart chemical parks (<xref ref-type="bibr" rid="B27">Li et al., 2017</xref>). The application of modern technologies for early warnings and precise prediction of potential risks becomes imperative (<xref ref-type="bibr" rid="B52">Wang et al., 2017</xref>; <xref ref-type="bibr" rid="B7">Chai et al., 2023</xref>), which is essential for fostering the establishment and growth of smart chemical parks (<xref ref-type="bibr" rid="B21">Kang et al., 2017</xref>).</p>
<p>Model-driven methods, including the SLAB, AFTOX, ALOHA, and PHAST models, have long been prevalent for analyzing the consequences of heavy gas leakage accidents (<xref ref-type="bibr" rid="B63">Zhang et al., 2007</xref>). Multiple studies (<xref ref-type="bibr" rid="B24">Li et al., 2019</xref>; <xref ref-type="bibr" rid="B48">Terzioglu and Iskender, 2021</xref>; <xref ref-type="bibr" rid="B3">Barjoee et al., 2022</xref>; <xref ref-type="bibr" rid="B11">Cheng et al., 2022</xref>) have used these models to determine the impact ranges of different hazardous accidents. While these models are computationally convenient and time efficient, their reliance on static assumptions limits their application in the dynamic environment of smart chemical parks. More recent advancements have seen the application of models using the MATLAB language (<xref ref-type="bibr" rid="B6">Bu et al., 2022</xref>; <xref ref-type="bibr" rid="B32">Liu and Wang, 2022</xref>) and computational fluid dynamics (CFD) software (<xref ref-type="bibr" rid="B56">Wu et al., 2024</xref>; <xref ref-type="bibr" rid="B69">Zhou et al., 2024</xref>), which offer refined simulations of leakage diffusion by providing time-specific concentration distributions. Nevertheless, the complexity and extensive computational time of these numerical models (<xref ref-type="bibr" rid="B50">Wang et al., 2019</xref>) limit their application in emergency response scenarios (<xref ref-type="bibr" rid="B37">Pan and Jiang, 2004</xref>). Therefore, there is a crucial need for a prediction model that can combine dynamic simulation capabilities with fast response to fulfill the real-time prediction requirements in smart parks.</p>
<p>Data-driven methods, encompassing both statistical and machine learning (ML) models, offer robust data processing and learning capabilities for predicting pollutant concentrations (<xref ref-type="bibr" rid="B72">Zhu L. et al., 2023</xref>; <xref ref-type="bibr" rid="B16">Fu et al., 2023</xref>). These methods excel in identifying statistical patterns and providing fast and efficient predictions. While data-driven methods analyze data to predict trends from historical patterns, their assumption of linear relationships often fails to capture the complex, nonlinear dynamics present in environmental data (<xref ref-type="bibr" rid="B2">Arsic et al., 2020</xref>; <xref ref-type="bibr" rid="B33">Lu et al., 2020</xref>), leading to less accurate predictions (<xref ref-type="bibr" rid="B64">Zhang et al., 2018</xref>). In contrast, <xref ref-type="bibr" rid="B1">Ahmed et al. (2020)</xref> demonstrated that ML models were better suited to handle the complex characteristics of pollutant data, such as nonlinearity, periodicity, and seasonality. <xref ref-type="bibr" rid="B14">Fang et al. (2019)</xref> compared a multilayer perceptron (MLP) model with a linear regression model using meteorological observations, PM<sub>2.5</sub> concentrations, and air quality index (AQI), finding the MLP model to be more accurate. Furthermore, ensemble learning (EL) has also been extensively investigated for predicting pollutant concentrations. <xref ref-type="bibr" rid="B53">Wang et al. (2021)</xref> analyzed pollutant emission data and meteorological observations, including wind speed, direction, temperature, and atmospheric pressure. They compared the effectiveness of various ML algorithms&#x2014;MLP, Decision Tree (DT), Support Vector Machine (SVM), eXtreme Gradient Boosting (XGBoost), Light Gradient Boosting Machine (LightGBM), and Stacking&#x2014;in predicting the impact of air pollution in the park. Based on the prediction performance of different algorithms, the more stable Stacking model, noted for its stability, was ultimately selected to ensure reliable prediction support for enterprises. Further, <xref ref-type="bibr" rid="B71">Zhu J. Y. et al. (2023)</xref> examined models for ground-level ozone concentration prediction using LightGBM, Random Forest (RF), SVM and Recurrent Neural Network (RNN) algorithms, leveraging pollutant concentrations and meteorological observations. The LightGBM model outperformed its counterparts, with R<sup>2</sup> of 0.92. These studies underscore the importance of diverse input data, including environmental, satellite remote sensing, and time-series data, as well as meteorological variables such as temperature, wind speed, direction, and humidity. Finally, a variety of mainstream algorithms, such as MLP, DT, RF, XGBoost, and LightGBM, were used to construct and compare prediction models (<xref ref-type="bibr" rid="B22">Kang et al., 2020</xref>; <xref ref-type="bibr" rid="B9">Chen et al., 2022</xref>). Currently, scholars worldwide have focused on employing data-driven methods in AQI studies to predict pollutant concentrations (<xref ref-type="bibr" rid="B34">Ma et al., 2022</xref>; <xref ref-type="bibr" rid="B38">Peng et al., 2023</xref>). However, the application of these techniques for predicting the risks associated with accidents remains less explored, primarily due to the reliance of pollutant concentration predictions on extensive monitoring data, in contrast to the limited data for accident risk prediction.</p>
<p>To improve risk prediction and overcome the challenges of not having easy access to observational data, some researchers (<xref ref-type="bibr" rid="B44">So et al., 2010</xref>; <xref ref-type="bibr" rid="B49">Wang et al., 2015</xref>; <xref ref-type="bibr" rid="B39">Qiu et al., 2017</xref>) initially trained ML models using real-time monitoring data to predict concentrations of hazardous gas leakage. However, due to considerable measurement inaccuracies, these predictions proved suboptimal. Currently, a methodology that integrates model-driven and data-driven methods has been employed for predicting pollutant concentrations. This method employs the CFD model to generate extensive input datasets. <xref ref-type="bibr" rid="B35">Ni et al. (2020)</xref> utilized simulation data from Fluent software to develop a deep learning-based model that accurately predicted the diffusion concentrations of toxic heavy gas. <xref ref-type="bibr" rid="B20">Jiao et al. (2021)</xref> constructed a quantitative consequence prediction model based on a toxic diffusion database derived from PHAST software simulations. RF, XGBoost and Deep Neural Network (DNN) algorithms were implemented and compared to identify the best performance method for model construction. <xref ref-type="bibr" rid="B51">Wang et al. (2023)</xref> formulated a leakage model for liquid ammonia storage tanks using PHAST software, considering factors such as atmospheric stability, wind speed, and leakage aperture. Six models were compared, including linear regression, K-Nearest Neighbor (KNN), AdaBoost, DT, RF, and XGBoost. The emergency response model of liquid ammonia leakage was ultimately developed based on the XGBoost algorithm. Additionally, some researchers (<xref ref-type="bibr" rid="B49">Wang et al., 2015</xref>; <xref ref-type="bibr" rid="B40">Qiu et al., 2018</xref>) employed artificial neural networks trained on the PHAST model and utilized particle swarm optimization (PSO) algorithms to predict the diffusion of hazardous gases. These methods were investigated with the aim of overcoming the prevailing challenges of achieving both high accuracy and prediction efficiency simultaneously. Despite these advancements, existing risk prediction research has certain deficiencies. Specifically, the dynamic process of hazardous chemical evaporation is often disregarded. Therefore, in this study, the CFD model was used to develop a dynamic model for heavy gas leakage diffusion and to evaluate the impact of various factors on accident consequences. Furthermore, while standard data from numerical simulations are commonly used, real-world data typically contain noise (<xref ref-type="bibr" rid="B28">Li X. et al., 2021</xref>; <xref ref-type="bibr" rid="B31">Liu et al., 2023</xref>), challenging the accuracy of ML-based prediction models when working with such data. The reliability of ML prediction models in handling noisy data remains an area requiring further investigation. Five algorithms&#x2014;MLP, DT, RF, XGBoost, LightGBM&#x2014;were selected to develop prediction models, which were systematically evaluated for their performance using both CFD standard and noisy data. Additionally, the prediction time of these models was compared to provide faster and more accurate gas diffusion prediction with the CFD model. The objective of these advancements is to enhance environmental risk management and mitigation efforts.</p>
<p>
<xref ref-type="sec" rid="s2">Section 2</xref> of this paper introduces the scenario and simulation scheme for a heavy gas leakage accident, the selected ML algorithms and the modelling process, and confirms the reliability of the CFD model in simulating heavy gas leakage. <xref ref-type="sec" rid="s3">Section 3</xref> analyzes the influencing factors, correlation between variables and diffusion mechanism of the consequences of the leakage accidents. It evaluates the ML models based on standard data and noisy data respectively, and identifies the most effective model for predictive analysis. <xref ref-type="sec" rid="s4">Section 4</xref> summarizes the research and the shortcomings of this study.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>2 Materials and methods</title>
<sec id="s2-1">
<title>2.1 Heavy gas leakage scenarios and simulation schemes</title>
<sec id="s2-1-1">
<title>2.1.1 Characteristics and hazardous of benzene</title>
<p>Benzene at ambient temperature is a colorless and transparent fluid characterized by a density of approximately 880&#xa0;kg/m<sup>3</sup>. The saturated vapor pressure of liquid benzene demonstrates variation across different temperatures (<xref ref-type="fig" rid="F1">Figure 1</xref>). Prolonged or high levels of exposure to liquid benzene can adversely affect health. A leakage resulting in the inhalation of benzene vapor can lead to symptoms such as headache, dizziness, drowsiness, causing severe neurological and liver damage, and being potentially fatal. Therefore, this paper aims to investigate the phenomenon of benzene leakage by developing a prediction model for the concentration and diffusion of heavy gas leakage.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>The saturated vapor pressure of liquid benzene varies with temperature.</p>
</caption>
<graphic xlink:href="fenvs-12-1409072-g001.tif"/>
</fig>
</sec>
<sec id="s2-1-2">
<title>2.1.2 Classification of hazardous distances</title>
<p>The standard concentrations of Acute Exposure Guideline Levels (AEGLs), established by the US National Advisory Committee (NAC), were utilized to determine hazardous distances. AEGLs apply to the adverse effects associated with short-duration and sudden-onset chemical leakages (<xref ref-type="bibr" rid="B66">Zhao and Chen, 2014</xref>). AEGLs are categorized into three levels: AEGL-1, AEGL-2 and AEGL-3. Each level corresponds to a specific level of acute toxicity. Under these standards, AEGL-1, AEGL-2 and AEGL-3 thresholds, corresponding to the 10-min liquid benzene leakage, are 420&#xa0;mg/m<sup>3</sup>, 6,500&#xa0;mg/m<sup>3</sup> and 31,000&#xa0;mg/m<sup>3</sup>, respectively. The concentration limits associated with specific injury symptoms are outlined in <xref ref-type="table" rid="T1">Table 1</xref>.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>AEGLs for the 10-min leakage of liquid benzene.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Classification</th>
<th align="center">Concentration limit (mg/m<sup>3</sup>)</th>
<th align="center">Injury symptoms</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">AEGL-1</td>
<td align="center">420</td>
<td align="center">Obvious discomfort, anger or certain symptoms</td>
</tr>
<tr>
<td align="center">AEGL-2</td>
<td align="center">6,500</td>
<td align="center">Irreversible or serious, long-lasting adverse effects</td>
</tr>
<tr>
<td align="center">AEGL-3</td>
<td align="center">31,000</td>
<td align="center">Could be life threatening or even fatal</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2-1-3">
<title>2.1.3 Assumptions for accident scenario</title>
<p>This study examined an accident scenario involving a liquid benzene storage tank located within a chemical park. The tank, characterized by its horizontal orientation and a capacity of 135&#xa0;m<sup>3</sup>, was maintained under ambient temperature and pressure conditions. The tank suffered a rupture due to the impact of an external object, forming a circular breach approximately 0.5&#xa0;m above the ground, encircled by a 35&#xa0;m radius cofferdam. Additionally, the internal and external factors that influence tank leakage are crucial to the study of gas leakage diffusion. <xref ref-type="bibr" rid="B70">Zhu et al. (2009)</xref> and <xref ref-type="bibr" rid="B45">Sun and Guo (2010)</xref> have discussed the significant effects of wind speed and atmospheric stability on gas diffusion. A summary of the current status of domestic and international research on leakage diffusion has been provided, and it has been demonstrated that leakage aperture, temperature and wind speed were important factors affecting gas diffusion (<xref ref-type="bibr" rid="B68">Zhou et al., 2012</xref>). Furthermore, <xref ref-type="bibr" rid="B51">Wang et al. (2023)</xref> constructed a liquid ammonia leakage prediction model based on environmental factors such as atmospheric stability, wind speed, and leakage aperture. Therefore, a range of values was selected for four factors: leakage aperture, wind speed, temperature, and atmospheric stability. These values are presented in <xref ref-type="sec" rid="s10">Supplementary Table S2</xref>. The apertures considered were 100&#xa0;mm 150&#xa0;mm and 200&#xa0;mm; wind speed ranged from 1&#xa0;m/s to 6&#xa0;m/s in 1&#xa0;m/s increments. Temperatures were set at 20&#xb0;C, 25&#xb0;C, 30&#xb0;C, 40&#xb0;C and 50&#xb0;C. Atmospheric stabilities were categorized as unstable, neutral and stable. The duration of leakage was set at 10&#xa0;min. In total, 270 different scenarios were simulated, with the fundamental parameters of the leakage tank detailed in <xref ref-type="sec" rid="s10">Supplementary Table S3</xref>.</p>
<p>The leakage rate of liquid benzene after a leakage is calculated using the Bernoulli Eq. <xref ref-type="disp-formula" rid="e1">1</xref> (<xref ref-type="bibr" rid="B15">Fu, 2008</xref>):<disp-formula id="e1">
<mml:math id="m1">
<mml:mrow>
<mml:msub>
<mml:mi>Q</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mi>d</mml:mi>
</mml:msub>
<mml:mi>A</mml:mi>
<mml:mi>&#x3c1;</mml:mi>
<mml:msqrt>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mfrac>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>2</mml:mn>
<mml:mi>g</mml:mi>
<mml:mi>h</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>where <inline-formula id="inf1">
<mml:math id="m2">
<mml:mrow>
<mml:msub>
<mml:mi>Q</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represents the rate of liquid leakage, kg/s. <inline-formula id="inf2">
<mml:math id="m3">
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mi>d</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, the liquid leakage coefficient, is taken as 0.65. <inline-formula id="inf3">
<mml:math id="m4">
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> denotes the area of rupture, m<sup>2</sup>. <inline-formula id="inf4">
<mml:math id="m5">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> signifies the density of the liquid, kg/m<sup>3</sup>. <inline-formula id="inf5">
<mml:math id="m6">
<mml:mrow>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf6">
<mml:math id="m7">
<mml:mrow>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are the internal and ambient pressures, respectively, Pa. <inline-formula id="inf7">
<mml:math id="m8">
<mml:mrow>
<mml:mi>g</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> represents the gravity acceleration at 9.81&#xa0;m/s<sup>2</sup>. <inline-formula id="inf8">
<mml:math id="m9">
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> indicates the height of the liquid level above the rupture, m. Given that liquid benzene was stored at ambient conditions, where both the storage and ambient temperatures remained below its boiling point, flash and heat evaporation processes were precluded. This scenario led to the formation of a liquid pool on the ground. The subsequent evaporation of this pool was primarily driven by the air movement over its surface, and the mass evaporation rate is thus calculated as:<disp-formula id="e2">
<mml:math id="m10">
<mml:mrow>
<mml:msub>
<mml:mi>Q</mml:mi>
<mml:mi>v</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
<mml:mi>p</mml:mi>
<mml:mfrac>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:msup>
<mml:mi>u</mml:mi>
<mml:mfrac>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfrac>
</mml:msup>
<mml:msup>
<mml:mi>r</mml:mi>
<mml:mfrac>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mn>4</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfrac>
</mml:msup>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>where <inline-formula id="inf9">
<mml:math id="m11">
<mml:mrow>
<mml:msub>
<mml:mi>Q</mml:mi>
<mml:mi>v</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> denotes the mass evaporation rate, kg/s. <inline-formula id="inf10">
<mml:math id="m12">
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf11">
<mml:math id="m13">
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> represent the atmospheric stability coefficients. <inline-formula id="inf12">
<mml:math id="m14">
<mml:mrow>
<mml:mi>p</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> specifies the vapor pressure at the surface of the liquid, Pa. <inline-formula id="inf13">
<mml:math id="m15">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the molar mass of the chemical, kg/mol. <inline-formula id="inf14">
<mml:math id="m16">
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> stands for the gas constant, J/(mol&#xb7;k). <inline-formula id="inf15">
<mml:math id="m17">
<mml:mrow>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> indicates the ambient temperature, K. <inline-formula id="inf16">
<mml:math id="m18">
<mml:mrow>
<mml:mi>u</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> refers to the ambient wind speed, m/s. <inline-formula id="inf17">
<mml:math id="m19">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the radius of the liquid pool, m. The rate of mass evaporation varied dynamically with the radius of the liquid pool. In cases of the continuous leakage, the dynamics radius of the liquid pool, <inline-formula id="inf18">
<mml:math id="m20">
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>, as a function of time <inline-formula id="inf19">
<mml:math id="m21">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, adhered to the following Eq. <xref ref-type="disp-formula" rid="e3">3</xref> (<xref ref-type="bibr" rid="B36">Nielsen et al., 1995</xref>). Ultimately, a CFD-based dynamic diffusion model of liquid benzene leakage has been developed. This model calculated the radius of the liquid pool and the corresponding evaporation rate per second throughout the 10-min leakage period under various environmental conditions.<disp-formula id="e3">
<mml:math id="m22">
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mroot>
<mml:mfrac>
<mml:mrow>
<mml:mn>9</mml:mn>
<mml:mi>&#x3c0;</mml:mi>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>32</mml:mn>
<mml:mi>g</mml:mi>
<mml:msub>
<mml:mi>Q</mml:mi>
<mml:mi>L</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mn>3</mml:mn>
</mml:mroot>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mn>3</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
<label>(3)</label>
</disp-formula>
</p>
</sec>
</sec>
<sec id="s2-2">
<title>2.2 Machine learning (ML) algorithms</title>
<sec id="s2-2-1">
<title>2.2.1 Introduction to ML algorithms</title>
<p>
<list list-type="simple">
<list-item>
<p>(1) Multi-layer perceptron (MLP)</p>
</list-item>
</list>
</p>
<p>The Multi-Layer Perceptron (MLP), a form of feed-forward neural network, encompasses two main processes: forward and back propagation (<xref ref-type="bibr" rid="B13">Ehteram et al., 2022</xref>). During forward propagation, the input data is processed through the layers of network, guided by weights and biases, to generate the predicted output of the model layer by layer. Conversely, back propagation adjusts these parameters via gradient descent by computing the gradient of the loss function with respect to the weights and biases, thus refining predictions to more closely match the true values.<list list-type="simple">
<list-item>
<p>(2) Decision tree (DT)</p>
</list-item>
</list>
</p>
<p>The Decision Tree (DT), a tree-based methodology, can effectively capture nonlinear relationships and clearly illustrate the decision-making process of each feature within a structured tree format. Nonetheless, the DT model exhibits a high sensitivity to noisy data, which can be mitigated by employing a Random Forest model, which mitigates the impact of noise (<xref ref-type="bibr" rid="B60">Yu et al., 2019</xref>).<list list-type="simple">
<list-item>
<p>(3) Random Forest (RF)</p>
</list-item>
</list>
</p>
<p>The Random Forest (RF) model enhances efficacy and robustness by integrating multiple DTs into a strong evaluator. It operates by having each decision tree independently predict on the input data, with the final prediction being derived through a method of weighted averaging or voting, as represented by the Eq. <xref ref-type="disp-formula" rid="e4">4</xref> <xref ref-type="bibr" rid="B4">Breiman (2001)</xref>:<disp-formula id="e4">
<mml:math id="m23">
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:mo>&#x22ef;</mml:mo>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(4)</label>
</disp-formula>where <inline-formula id="inf20">
<mml:math id="m24">
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> represents the aggregate prediction from each simple decision tree <inline-formula id="inf21">
<mml:math id="m25">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>. In constructing each decision tree, the RF model mitigates noise and overfits by employing bootstrap sampling, which means drawing from the training set with replacement (<xref ref-type="bibr" rid="B55">Wu and Zhao, 2013</xref>).<list list-type="simple">
<list-item>
<p>(4) eXtreme gradient boosting (XGBoost)</p>
</list-item>
</list>
</p>
<p>The eXtreme Gradient Boosting (XGBoost) model represents an advanced implementation of gradient boosting algorithms and stands as a noteworthy component in the EL models, playing a pivotal role in ensemble learning (EL) models due to its efficacy in capturing complex and nonlinear interactions (<xref ref-type="bibr" rid="B10">Chen and Guestrin, 2016</xref>). The core of the XGBoost model is a gradient boosting framework that sequentially constructs an ensemble of weak learners, typically decision trees, to minimize a differentiable loss function. What sets XGBoost apart is its efficient handling of sparse data and missing values, an aspect crucial for robustness in real-world data applications. It incorporates a sparsity-aware algorithm for handling missing data and employs a weighted quantile sketch for efficient approximate tree learning. To enhance generalization and mitigate overfitting, the XGBoost model integrates specific regularization mechanisms, including L1 (Lasso regression) and L2 (Ridge regression) penalties. These regularization terms add a penalization component to the objective function, effectively controlling the complexity of the model. The main formulas for the XGBoost model are as follows Eqs <xref ref-type="disp-formula" rid="e5">5</xref>&#x2013;<xref ref-type="disp-formula" rid="e7">7</xref>:<disp-formula id="e5">
<mml:math id="m26">
<mml:mrow>
<mml:mi>O</mml:mi>
<mml:mi>b</mml:mi>
<mml:mi>j</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>v</mml:mi>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi mathvariant="normal">&#x398;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>K</mml:mi>
</mml:msubsup>
<mml:mi mathvariant="normal">&#x3a9;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(5)</label>
</disp-formula>
<disp-formula id="e6">
<mml:math id="m27">
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:math>
<label>(6)</label>
</disp-formula>
<disp-formula id="e7">
<mml:math id="m28">
<mml:mrow>
<mml:mi mathvariant="normal">&#x3a9;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>&#x3b3;</mml:mi>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:mfrac>
<mml:mi>&#x3b1;</mml:mi>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:munderover>
</mml:mstyle>
<mml:mrow>
<mml:mfenced open="|" close="|" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:mfrac>
<mml:mi>&#x3bb;</mml:mi>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:munderover>
</mml:mstyle>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:math>
<label>(7)</label>
</disp-formula>
</p>
<p>In formula <xref ref-type="disp-formula" rid="e5">(5)</xref>, the first term, <inline-formula id="inf22">
<mml:math id="m29">
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> aggregates the losses computed over all <inline-formula id="inf23">
<mml:math id="m30">
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> samples, where <inline-formula id="inf24">
<mml:math id="m31">
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> measures the discrepancy between the predicted <inline-formula id="inf25">
<mml:math id="m32">
<mml:mrow>
<mml:msub>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and the actual <inline-formula id="inf26">
<mml:math id="m33">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> values, which is defined here as the square of the residuals. The second term, <inline-formula id="inf27">
<mml:math id="m34">
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>K</mml:mi>
</mml:msubsup>
</mml:mstyle>
<mml:mrow>
<mml:mi mathvariant="normal">&#x3a9;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>, is the sum of regularization terms for <inline-formula id="inf28">
<mml:math id="m35">
<mml:mrow>
<mml:mi>K</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> weak learners, typically decision trees, to control the complexity of the model. The term <inline-formula id="inf29">
<mml:math id="m36">
<mml:mrow>
<mml:mi>&#x3b3;</mml:mi>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> adds a penalty proportional to the number of leaf nodes <inline-formula id="inf30">
<mml:math id="m37">
<mml:mrow>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> in the tree <inline-formula id="inf31">
<mml:math id="m38">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, with <inline-formula id="inf32">
<mml:math id="m39">
<mml:mrow>
<mml:mi>&#x3b3;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> serving as a non-negative regularization parameter. This term restricts tree growth and aids in mitigating overfitting by penalizing excessive complexity. The expression <inline-formula id="inf33">
<mml:math id="m40">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:mfrac>
<mml:mi>&#x3b1;</mml:mi>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:msubsup>
</mml:mstyle>
<mml:mrow>
<mml:mfenced open="|" close="|" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> denotes the L1 regularization (Lasso), which imposes a penalty on the absolute values of the leaf weights <inline-formula id="inf34">
<mml:math id="m41">
<mml:mrow>
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. This promotes sparsity in the leaf weights, potentially reducing some to zero, thereby facilitating feature selection within the trees. Meanwhile, <inline-formula id="inf35">
<mml:math id="m42">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:mfrac>
<mml:mi>&#x3bb;</mml:mi>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:msubsup>
</mml:mstyle>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> signifies the L2 regularization on the leaf weights <inline-formula id="inf36">
<mml:math id="m43">
<mml:mrow>
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> of the tree, with <inline-formula id="inf37">
<mml:math id="m44">
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> serving as the regularization coefficient.<list list-type="simple">
<list-item>
<p>(5) Light Gradient Boosting Machine (LightGBM)</p>
</list-item>
</list>
</p>
<p>The Light Gradient Boosting Machine (LightGBM) model, also an ML algorithm based on gradient boosting trees (<xref ref-type="bibr" rid="B71">Zhu J. Y. et al., 2023</xref>), employs an innovative histogram-based learning method that not only reduces computational complexity but also significantly enhances training efficiency on large datasets (<xref ref-type="bibr" rid="B18">Gao et al., 2020</xref>). By iteratively learning from gradient boosting trees, the LightGBM model consistently improves model performance, exhibiting robust generalization capabilities and effectiveness, particularly in addressing regression problems (<xref ref-type="bibr" rid="B29">Li Z. et al., 2021</xref>; <xref ref-type="bibr" rid="B54">Wei et al., 2021</xref>).</p>
</sec>
<sec id="s2-2-2">
<title>2.2.2 Data pre-processing and model setting</title>
<p>The typical workflow for applying ML models encompasses several critical steps (<xref ref-type="bibr" rid="B5">Bruha, 2000</xref>): data collection, data preprocessing, feature correlation analysis, parameter tuning, model training and validation.</p>
<p>This study generated various accident scenario hypotheses using the CFD model, with the CFD simulation data serving as the training datasets. For the accident scenario outlined in <xref ref-type="sec" rid="s2-1-3">section 2.1.3</xref>, the CFD model was employed to simulate 270 different working conditions. This simulation generated concentration data at various downwind distances at 10-s intervals, culminating in a total of 515,160 datasets. The variables included in the analysis were time, leakage aperture, wind speed, temperature, atmospheric stability and downwind distance, with the concentration outcome (C1) serving as the target variable. These variables were normalized using Z-Score standardization. Atmospheric stability, a categorical variable, was converted into a numerical format using One-Hot encoding. Pearson correlation coefficient, designed by the letter &#x2018;<inline-formula id="inf38">
<mml:math id="m45">
<mml:mrow>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>c</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>&#x2019;, was employed to quantify the linear relationships between the variables. The correlation coefficient between each pair of variables was calculated using the following formula <xref ref-type="disp-formula" rid="e8">(8)</xref> (<xref ref-type="bibr" rid="B43">Shaik et al., 2024</xref>). To assess the model performance, a subset featuring specific conditions&#x2014;200&#xa0;mm leakage aperture, 6&#xa0;m/s wind speed, 50&#xb0;C temperature, and stable atmospheric stability&#x2014;was selected for validation. The remaining data was divided into an 80% training set and a 20% testing set. Moreover, Bayesian optimization and 10-fold cross-validation were applied for parameter tuning and model training. <xref ref-type="table" rid="T2">Table 2</xref> displays the hyperparameter range domains for each model and the optimization results achieved by the algorithm.<disp-formula id="e8">
<mml:math id="m46">
<mml:mrow>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>c</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>x</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
<mml:msqrt>
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>x</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:msqrt>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(8)</label>
</disp-formula>where <inline-formula id="inf39">
<mml:math id="m47">
<mml:mrow>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>c</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the correlation coefficient. <inline-formula id="inf40">
<mml:math id="m48">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf41">
<mml:math id="m49">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> denote the values of the two variables. <inline-formula id="inf42">
<mml:math id="m50">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>x</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf43">
<mml:math id="m51">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> represent the means of the two variables. <inline-formula id="inf44">
<mml:math id="m52">
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> signifies the number of samples.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Hyperparameter range domains of each model and results using Bayesian optimization.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">ML model</th>
<th align="center">Hyperparameter</th>
<th align="center">Range domains</th>
<th align="center">Optimal value</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="2" align="center">MLP</td>
<td align="center">Hidden layer</td>
<td align="center">[50,600]</td>
<td align="center">511</td>
</tr>
<tr>
<td align="center">Learning rate</td>
<td align="center">[0.001,0.1]</td>
<td align="center">0.088</td>
</tr>
<tr>
<td rowspan="2" align="center">DT</td>
<td align="center">Maximum tree depth</td>
<td align="center">[1,30]</td>
<td align="center">25</td>
</tr>
<tr>
<td align="center">Minimum sample size of nodes</td>
<td align="center">[1,30]</td>
<td align="center">6</td>
</tr>
<tr>
<td rowspan="3" align="center">RF</td>
<td align="center">N estimator</td>
<td align="center">[10,400]</td>
<td align="center">243</td>
</tr>
<tr>
<td align="center">Maximum tree depth</td>
<td align="center">[3,25]</td>
<td align="center">25</td>
</tr>
<tr>
<td align="center">Minimum sample size of nodes</td>
<td align="center">[1,30]</td>
<td align="center">7</td>
</tr>
<tr>
<td rowspan="6" align="center">XGBoost</td>
<td align="center">N estimator</td>
<td align="center">[100,300]</td>
<td align="center">287</td>
</tr>
<tr>
<td align="center">Maximum tree depth</td>
<td align="center">[4,30]</td>
<td align="center">15</td>
</tr>
<tr>
<td align="center">Minimum sample size of nodes</td>
<td align="center">[2,30]</td>
<td align="center">22</td>
</tr>
<tr>
<td align="center">Gamma</td>
<td align="center">[0,5]</td>
<td align="center">1</td>
</tr>
<tr>
<td align="center">Alpha</td>
<td align="center">[0,5]</td>
<td align="center">1</td>
</tr>
<tr>
<td align="center">Lamba</td>
<td align="center">[0,5]</td>
<td align="center">2</td>
</tr>
<tr>
<td rowspan="3" align="center">LightGBM</td>
<td align="center">N estimator</td>
<td align="center">[100,300]</td>
<td align="center">161</td>
</tr>
<tr>
<td align="center">Maximum tree depth</td>
<td align="center">[4,30]</td>
<td align="center">27</td>
</tr>
<tr>
<td align="center">Learning rate</td>
<td align="center">[0.0001,10]</td>
<td align="center">0.58</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>To assess prediction accuracy for diffusion concentration within the ML algorithms, this study employed four principal metrics: the root mean square error (RMSE), mean absolute error (MAE), coefficient of determination (R<sup>2</sup>) and index of agreement (IOA). The formulas are as follows Eqs <xref ref-type="disp-formula" rid="e9">9</xref>&#x2013;<xref ref-type="disp-formula" rid="e12">12</xref> (<xref ref-type="bibr" rid="B41">Shaik et al., 2022</xref>; <xref ref-type="bibr" rid="B42">Shaik et al., 2023</xref>; <xref ref-type="bibr" rid="B43">Shaik et al., 2024</xref>):<disp-formula id="e9">
<mml:math id="m53">
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:math>
<label>(9)</label>
</disp-formula>
<disp-formula id="e10">
<mml:math id="m54">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>100</mml:mn>
<mml:mo>%</mml:mo>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:mrow>
<mml:mfenced open="|" close="|" separators="&#x7c;">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mfrac>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(10)</label>
</disp-formula>
<disp-formula id="e11">
<mml:math id="m55">
<mml:mrow>
<mml:msup>
<mml:mi>R</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
</mml:mstyle>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
</mml:mstyle>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(11)</label>
</disp-formula>
<disp-formula id="e12">
<mml:math id="m56">
<mml:mrow>
<mml:mi>I</mml:mi>
<mml:mi>O</mml:mi>
<mml:mi>A</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
</mml:mstyle>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
</mml:mstyle>
<mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close="|" separators="&#x7c;">
<mml:mrow>
<mml:mo>(</mml:mo>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
<mml:mrow>
<mml:mfenced open="|" close="" separators="&#x7c;">
<mml:mrow>
<mml:mo>&#x2b;</mml:mo>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x7c;</mml:mo>
</mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mfenced open="" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mrow>
<mml:mfenced open="" close="|" separators="&#x7c;">
<mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(12)</label>
</disp-formula>where <inline-formula id="inf45">
<mml:math id="m57">
<mml:mrow>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represents the value predicted by the ML model. <inline-formula id="inf46">
<mml:math id="m58">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> denotes the value simulated by the CFD model. <inline-formula id="inf47">
<mml:math id="m59">
<mml:mrow>
<mml:mover accent="true">
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf48">
<mml:math id="m60">
<mml:mrow>
<mml:mover accent="true">
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> correspond to the mean of ML predicted values and CFD simulated values, respectively, with <inline-formula id="inf49">
<mml:math id="m61">
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> signifying the sample size.</p>
</sec>
</sec>
<sec id="s2-3">
<title>2.3 CFD modelling and model validation</title>
<sec id="s2-3-1">
<title>2.3.1 Selection of validation dataset</title>
<p>Before providing accurate sample data for ML models, it is necessary to validate the reliability of the CFD model in simulating the diffusion of heavy gas leakage. The purpose of this study is to validate the efficacy of the PHOENICS software in simulating heavy gas leakage, specifically through the application of the renowned Burro series experiments. These experiments took place in a circular water tank, measuring 58&#xa0;m in diameter and 1&#xa0;m in depth, where the liquefied natural gas (LNG) was released at a temperature of &#x2212;164&#xb0;C (<xref ref-type="bibr" rid="B23">Koopman et al., 1982</xref>). The significant temperature difference between the released LNG and surrounding environment facilitated the rapid vaporization of LNG, resulting in the formation of a cold and heavy gas cloud, approximately 1.5 times heavier than air (<xref ref-type="bibr" rid="B59">Yu et al., 2018</xref>). Methane concentrations were measured using sensors located at distances of 58&#xa0;m, 140&#xa0;m, 400&#xa0;m and 800&#xa0;m downwind from the release point. The initial conditions of the Burro series experiments are comprehensively outlined in <xref ref-type="sec" rid="s10">Supplementary Table S4</xref>.</p>
</sec>
<sec id="s2-3-2">
<title>2.3.2 CFD modelling</title>
<p>
<list list-type="simple">
<list-item>
<p>(1) Physical model and governing equations</p>
</list-item>
</list>
</p>
<p>In this study, the computational domain was defined as 1,000&#xa0;m &#xd7; 300&#xa0;m &#xd7; 50&#xa0;m. To enhance grid structure efficiency and minimize computational time, the domain was segmented into 200 &#xd7; 100 &#xd7; 25 using a gradient grid. The mesh independence analysis ensured that the CFD data remained consistent as the mesh size varied, as detailed in the <xref ref-type="sec" rid="s10">Supplementary Text S1</xref>. <xref ref-type="fig" rid="F2">Figure 2</xref> illustrates the configuration of the detailed domain and grid setup within the CFD model. These modeling parameters were meticulously chosen to accurately simulate the heavy gas leakage scenario, laying a robust groundwork for subsequent analysis.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>The configuration of the CFD model, focusing on: <bold>(A)</bold> model setting on the X-Z plane and <bold>(B)</bold> model setting on the Y-Z plane.</p>
</caption>
<graphic xlink:href="fenvs-12-1409072-g002.tif"/>
</fig>
<p>In this study, the <italic>Core</italic> module of the PHOENICS 6.0 software was used as the simulation platform. The turbulence model chosen was the widely used standard k-&#x3b5; model within PHOENICS, with the specific equations given by Eqs <xref ref-type="disp-formula" rid="e13">13</xref>, <xref ref-type="disp-formula" rid="e14">14</xref>:<disp-formula id="e13">
<mml:math id="m62">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2202;</mml:mo>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#x2b;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mi>&#x2202;</mml:mi>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="&#x7c;">
<mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>&#x3bc;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x3c1;</mml:mi>
<mml:mi>&#x3b5;</mml:mi>
</mml:mrow>
</mml:math>
<label>(13)</label>
</disp-formula>
<disp-formula id="e14">
<mml:math id="m63">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
<mml:mi>&#x3b5;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#x2b;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mi>&#x3b5;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mi>&#x2202;</mml:mi>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="&#x7c;">
<mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="&#x7c;">
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>&#x3bc;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>&#x3b5;</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mi>&#x2202;</mml:mi>
<mml:mi>&#x3b5;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2202;</mml:mo>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mi>&#x3b5;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfrac>
<mml:mrow>
<mml:mi>&#x3b5;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mi>k</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mi>&#x3b5;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mi>&#x3c1;</mml:mi>
<mml:mfrac>
<mml:mrow>
<mml:msup>
<mml:mi>&#x3b5;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(14)</label>
</disp-formula>where <inline-formula id="inf50">
<mml:math id="m64">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3bc;</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> denotes the turbulent viscosity, kg/(m&#xb7;s). <inline-formula id="inf51">
<mml:math id="m65">
<mml:mrow>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> indicates the velocity component in the <inline-formula id="inf52">
<mml:math id="m66">
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>-direction, m/s, and <inline-formula id="inf53">
<mml:math id="m67">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> corresponds to the spatial coordinate in that direction, m. <inline-formula id="inf54">
<mml:math id="m68">
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the molecular viscosity, kg/(m&#xb7;s). <inline-formula id="inf55">
<mml:math id="m69">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf56">
<mml:math id="m70">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>&#x3b5;</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are the Prandtl numbers associated with turbulence kinetic energy <inline-formula id="inf57">
<mml:math id="m71">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> and dissipation rate <inline-formula id="inf58">
<mml:math id="m72">
<mml:mrow>
<mml:mi>&#x3b5;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, respectively, with their values set at <inline-formula id="inf59">
<mml:math id="m73">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> &#x3d; 1.0 and <inline-formula id="inf60">
<mml:math id="m74">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>&#x3b5;</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> &#x3d; 1.3. <inline-formula id="inf61">
<mml:math id="m75">
<mml:mrow>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the turbulence kinetic energy production term generated by the mean velocity gradient, m<sup>2</sup>/s<sup>3</sup>. <inline-formula id="inf62">
<mml:math id="m76">
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mi>&#x3b5;</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf63">
<mml:math id="m77">
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mi>&#x3b5;</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represent empirical constants taken as 1.44 and 1.92, respectively.<list list-type="simple">
<list-item>
<p>(2) Physical Properties</p>
</list-item>
</list>
</p>
<p>In the <italic>Properties</italic> section, set the ambient temperature to 35.4&#xb0;C and the atmospheric pressure to 101,325&#xa0;Pa. The <italic>Inverse Linear</italic> option was selected for the density setting to configure the density of the methane-air mixture, thereby accurately simulating the settling process of heavy gas, incorporating the impact of gravity was vital. Additionally, activate the gravity option <italic>Density Difference</italic> and set the gravitational acceleration to &#x2212;9.81&#xa0;m/s<sup>2</sup> in the <italic>Z</italic> direction.<list list-type="simple">
<list-item>
<p>(3) Boundary condition settings</p>
</list-item>
</list>
</p>
<p>The inlet boundary conditions of the model utilized the <italic>Wind</italic> property to define wind speed and direction. The index method ensured an accurate representation of the vertical gradient change in wind speed (<xref ref-type="bibr" rid="B26">Li and Tian, 2011</xref>). Given that the Burro series experiments were conducted in an open area without obvious obstacles, the effective roughness height in this study was set at 0.0002&#xa0;m, and the wind profile index was chosen as 0.16.<list list-type="simple">
<list-item>
<p>(4) Inlet settings</p>
</list-item>
</list>
</p>
<p>A series of <italic>Inlet</italic> objects were selected to simulate the evaporation rates from the liquid pool. The leakage scenario was simplified to model the complete evaporation of LNG from a 58&#xa0;m diameter liquid pool. The evaporation rate was approximated as the leakage rate, with the <italic>Mass Flow</italic> of the <italic>Inlet</italic> object set to 24.2&#xa0;m<sup>3</sup>/min. Additionally, the solver variable C1 was added into the <italic>Models</italic> section, assigning a value of 1.0. The results of C1 were extracted after the completion of simulation and converted to the concentration of methane (CH<sub>4</sub>) using calculation formula <xref ref-type="disp-formula" rid="e15">(15)</xref>:<disp-formula id="e15">
<mml:math id="m78">
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mn>4</mml:mn>
</mml:msub>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>C</mml:mi>
<mml:mn>1</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:msub>
<mml:mi>&#x3c1;</mml:mi>
<mml:mi>a</mml:mi>
</mml:msub>
<mml:mo>&#xd7;</mml:mo>
<mml:msup>
<mml:mn>10</mml:mn>
<mml:mn>6</mml:mn>
</mml:msup>
</mml:mrow>
</mml:math>
<label>(15)</label>
</disp-formula>where <inline-formula id="inf64">
<mml:math id="m79">
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mn>4</mml:mn>
</mml:msub>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represents the concentration of CH<sub>4</sub>, mg/m<sup>3</sup>.</p>
</sec>
<sec id="s2-3-3">
<title>2.3.3 CFD simulation validation</title>
<p>The Burro nine experiment was selected to evaluate the accuracy of the CFD model in simulating the diffusion of heavy gas leakage. <xref ref-type="fig" rid="F3">Figure 3</xref> illustrates the concentration distribution of the gas cloud at T &#x3d; 80&#xa0;s for the Burro nine experiment across two planes. <xref ref-type="fig" rid="F3">Figure 3A</xref> shows the Y-Z plane at a distance of 140&#xa0;m downwind, where the observed gas cloud extended approximately 60&#xa0;m to the left and 28&#xa0;m to the right. Conversely, the CFD simulation showed an extension of about 48&#xa0;m on both sides, revealing a minor discrepancy between the simulated and observed spreads. This discrepancy is likely due to a deviation between the actual and simulated wind directions, as well as the uneven terrain at 140&#xa0;m. This uneven terrain could account for the slightly elevated height of the gas cloud on the northern side compared to the southern side. <xref ref-type="fig" rid="F3">Figure 3B</xref> illustrates to the X-Y plane at a height of Z &#x3d; 1&#xa0;m, where the simulated range of CFD is slightly narrower than the actual observed diffusion range. The violent phase change reaction occurring near the leakage source affected the concentration sensor at 57&#xa0;m, resulting in a discontinuity in the 5% concentration contour. <xref ref-type="bibr" rid="B65">Zhang et al. (2015)</xref> used the FEM3 and CFD models to validate the Burro nine experiment, simulating the gas cloud extent on the Y-Z plane at a downwind distance of 140&#xa0;m to be 53&#xa0;m and 75&#xa0;m, respectively. The farthest distances by the CFD model for volume concentrations of 5%, 2%, and 1% on the X-Y plane were about 190&#xa0;m, 368&#xa0;m, and 500&#xa0;m. <xref ref-type="fig" rid="F3">Figures 3A,B</xref> demonstrate that the gas cloud extent simulated by the CFD model adopted in this paper is reasonable. Additionally, the simulated diffusion ranges being narrower than observed could also be attributed to the instability of the wind speed. Despite these differences, the overall diffusion ranges of the gas cloud were consistent with the actual experimental results, accurately reflecting the diffusion dynamics of the heavy gas leakage.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Distribution of methane concentrations across various planes during the Burro nine experiment: <bold>(A)</bold> the distribution on the Y-Z plane at a distance of 140&#xa0;m downwind at T &#x3d; 80&#xa0;s, and <bold>(B)</bold> the distribution on the X-Y plane at a height of 1&#xa0;m, also at T &#x3d; 80&#xa0;s.</p>
</caption>
<graphic xlink:href="fenvs-12-1409072-g003.tif"/>
</fig>
<p>It specifically depicts the methane concentration over time at a distance of 140&#xa0;m downwind in <xref ref-type="fig" rid="F4">Figure 4A</xref>, with the observed peak concentration reaching 9.6%. The CFD simulation peaking at 9.62%, resulted in a minimal relative error of 0.2%. While at a distance of 400&#xa0;m downwind, the observed maximum concentration was 3.96%, compared to the CFD simulation&#x2019;s maximum value of 3.23%, leading to a relative error of 18.43% (<xref ref-type="fig" rid="F4">Figure 4B</xref>). <xref ref-type="bibr" rid="B45">Sun and Guo (2010)</xref> used the DEGADIS model to validate the Burro nine experiment, and the relative errors of the simulation concentrations at downwind distances of 140&#xa0;m and 400&#xa0;m were 44.7% and 16.49%, respectively. <xref ref-type="bibr" rid="B46">Sun et al. (2013)</xref> simulated the maximum concentrations at different downwind distances of the Burro eight experiment using the Fluent software, with an average relative error of 19.62%. This demonstrates that the CFD model utilized in this study effectively enhanced the precision of concentration prediction, maintaining relative errors within permissible limits. Therefore, the CFD model is considered to accurately capture the trends of the observed methane concentrations, although temporal variations are present. Such variations may arise from the inconsistent evaporation rates of LNG leakage and the dynamics size of the evaporating liquid pool, which, if assumed constant in the model, will introduce validation uncertainties. <xref ref-type="fig" rid="F4">Figures 4C,D</xref> reveal that the simulated heights of the air clouds with varying concentrations at a distance of 400&#xa0;m downwind slightly exceeded the actual measurements, yet their lateral extents remained broadly consistent. The overall trend alignment and acceptable error margins confirm the CFD simulation&#x2019;s efficacy for subsequent research.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Methane concentration values at different downwind distances for the Burro nine experiment. <bold>(A)</bold> and <bold>(B)</bold> are plots of methane concentration values with time at 140&#xa0;m and 400&#xa0;m downwind distance, respectively. <bold>(C)</bold> and <bold>(D)</bold> are the concentration distributions of experimental and CFD simulated values at T &#x3d; 120&#xa0;s and downwind distance of 400&#xa0;m, respectively.</p>
</caption>
<graphic xlink:href="fenvs-12-1409072-g004.tif"/>
</fig>
</sec>
</sec>
</sec>
<sec sec-type="results|discussion" id="s3">
<title>3 Results and discussion</title>
<sec id="s3-1">
<title>3.1 Analysis of factors affecting benzene leakage accidents consequences</title>
<sec id="s3-1-1">
<title>3.1.1 Dynamic characteristics of liquid pool radius and evaporation rate</title>
<p>Upon the leakage of benzene, its high boiling point resulted in the formation of a liquid pool on the ground. The evaporation of the liquid pool was facilitated by the airflow over the pool surface, with both the radius of the pool and the evaporation rate changing dynamically. Before exploring the impacts of various factors on the diffusion distances of benzene, this study initially analyzed the influences of four factors on the dynamic changes of the radius and evaporation rate of the liquid pool. The results are presented in <xref ref-type="fig" rid="F5">Figure 5</xref>, which displays the dynamic changes of the liquid pool radius and evaporation rate under different wind speeds, temperatures, leakage apertures and atmospheric stabilities, labelled A-L respectively.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Variation patterns of liquid pool radius and evaporation rate with time under different scenarios, where <bold>(A)</bold> and <bold>(B)</bold>, <bold>(C)</bold> and <bold>(D)</bold>, <bold>(E)</bold> and <bold>(F)</bold>, and <bold>(G)</bold> and <bold>(H)</bold> denote the dynamic changes of liquid pool radius and evaporation rate under different wind speeds, temperatures, leakage apertures, and atmospheric stabilities, respectively.</p>
</caption>
<graphic xlink:href="fenvs-12-1409072-g005.tif"/>
</fig>
<p>An increase in wind speed from 1&#xa0;m/s to 6&#xa0;m/s extended the duration required for the liquid pool to achieve its maximum radius from 145&#xa0;s to 163&#xa0;s, currently elevating the evaporation rate from 7.36&#xa0;kg/s to 31.88&#xa0;kg/s (<xref ref-type="fig" rid="F5">Figures 5A,B</xref>). This indicates that higher wind speeds not only delay the attainment of the maximum radius of the liquid pool but also substantially enhance the evaporation rate. Such an increase accelerates the volatility and diffusion rate of benzene, thereby enlarging the potential hazardous ranges. Furthermore, a temperature increase from 20&#xb0;C to 50&#xb0;C similarly impacted these dynamics, lengthening the time to reach the maximum radius from 144&#xa0;s to 163&#xa0;s, while elevating the evaporation rate from 6.03&#xa0;kg/s to 31.88&#xa0;kg/s (<xref ref-type="fig" rid="F5">Figures 5C,D</xref>). The rise in temperature not only accelerated the evaporation rate but also slowed down the growth rate of the radius of the liquid pool, prolonging the time to reach its maximum. Variations in the leakage aperture slightly adjusted the time for the liquid pool to achieve its maximum radius from 159&#xa0;s to 163&#xa0;s. The evaporation rate attained a consistent peak of 31.88&#xa0;kg/s at different apertures (<xref ref-type="fig" rid="F5">Figures 5E,F</xref>), indicating a minimal effect of the leakage aperture on the growth of the radius and evaporation rate. Under disparate conditions of atmospheric stability, the radius reached its zenith between 163&#xa0;s and 165&#xa0;s, with the lowest evaporation rate under unstable conditions at 31.88&#xa0;kg/s, and slightly higher under stable and neutral conditions at 33.62&#xa0;kg/s and 33&#xa0;kg/s, respectively (<xref ref-type="fig" rid="F5">Figures 5G,H</xref>). Atmospheric stability exerts a minor influence on liquid pool expansion and evaporation rate, as indicated by the coefficients <inline-formula id="inf65">
<mml:math id="m80">
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf66">
<mml:math id="m81">
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> in formula <xref ref-type="disp-formula" rid="e2">(2)</xref>. Subsequent research will investigate the effects of these factors on the distribution of concentrations and hazardous distances, providing scientific support for effective risk management and emergency preparedness.</p>
<p>A comprehensive analysis indicated that temperature was the primary factor influencing the growth of the evaporation rate. The impact of wind speed on the radius growth was negligible but significantly enhanced evaporation rate. The impact of leakage aperture and atmospheric stability was insignificant. Related studies (<xref ref-type="bibr" rid="B17">Galeev et al., 2013</xref>; <xref ref-type="bibr" rid="B19">Hu et al., 2024</xref>) have also emphasized the important role of environmental factors in chemical leakage accidents, in particular the significant effect of wind speed and temperature on the consequences of leakage.</p>
</sec>
<sec id="s3-1-2">
<title>3.1.2 Dynamic characteristics of concentration distribution</title>
<p>To explore the dynamic characteristics of concentration distribution, a specific scenario was chosen for detailed analysis: liquid benzene leakage under stable atmospheric conditions, featuring a 200&#xa0;mm aperture, a wind speed of 6&#xa0;m/s and a temperature of 50&#xb0;C. This study methodically examined the changes in concentration distribution within the hazardous distances for various AEGLs at 150&#xa0;s, 300&#xa0;s, 450&#xa0;s, and 600&#xa0;s. <xref ref-type="fig" rid="F6">Figure 6</xref> illustrates the concentration distribution at different times, where A-D, E-H, and I-N correspond to AEGL-1, AEGL-2, and AEGL-3 distances, respectively.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Hazardous ranges corresponding to AEGL-1 <bold>(A&#x2013;D)</bold>, AEGL-2 <bold>(E&#x2013;H)</bold>, and AEGL-3 <bold>(I&#x2013;L)</bold> at different time (T &#x3d; 150&#xa0;s, 300&#xa0;s, 450&#xa0;s, 600&#xa0;s).</p>
</caption>
<graphic xlink:href="fenvs-12-1409072-g006.tif"/>
</fig>
<p>Initially, at 150&#xa0;s, the hazardous range of AEGL-1 was predominantly near the leakage source (<xref ref-type="fig" rid="F6">Figure 6A</xref>). By 600&#xa0;s, the concentration range had spread to 2780.20&#xa0;m, revealing a significant downwind stretch while the lateral enlargement of the plume remained comparatively limited (<xref ref-type="fig" rid="F6">Figure 6D</xref>). Compared to AEGL-1, the diffusion rate and the hazardous range of AEGL-2 were markedly reduced. Notably, at 300 and 390&#xa0;s, the maximum AEGL-2 distance exhibited minimal change, suggesting a plateau in the diffusion speed and expansion range once a certain concentration was reached (<xref ref-type="fig" rid="F6">Figure 6F</xref>). Beyond 300&#xa0;s, both the downwind distance and plume width remained relatively stable, leading to a more homogeneous distribution of concentration (<xref ref-type="fig" rid="F6">Figures 6G,H</xref>). The diffusion speed and range of AEGL-3 showed an even more pronounced reduction (<xref ref-type="fig" rid="F6">Figure 6I&#x2013;L</xref>). By 270&#xa0;s, the hazardous range reached a steady state at 74.27&#xa0;m, highlighting the restricted diffusion range for high-concentration benzene over a brief period. The lateral expansion of the plume was notably constrained, primarily due to the dominance of wind speed over turbulent mixing, facilitating predominantly downwind diffusion. Consequently, wind speed emerges as a critical determinant in the plume diffusion process, determining the velocity of downwind diffusion (<xref ref-type="bibr" rid="B73">Gong et al., 2023</xref>). Meanwhile, initial release conditions, such as leakage rate and temperature, along with local turbulence, play collective roles in shaping the plume width and diffusion uniformity.</p>
</sec>
<sec id="s3-1-3">
<title>3.1.3 Dynamic characteristics of hazardous ranges</title>
<p>In the case of liquid benzene leakage, the hazardous consequences were evaluated using AEGLs distances. The mechanism of the change of AEGLs distances under the four main factors was analyzed by altering the environmental conditions, with the findings illustrated in <xref ref-type="fig" rid="F7">Figure 7</xref>. Notably, the AEGL-1 and AEGL-2 distances increased significantly as temperature rose. The trend for the AEGL-3 distance was only exhibited at higher temperatures. This phenomenon may be attributed to the fact that an increase in temperature elevated the saturated vapor pressure of benzene, thereby expediting the evaporation rate and diffusion process (<xref ref-type="bibr" rid="B61">Yu et al., 2021</xref>). Furthermore, for AEGL-3, the concentration value (31,000&#xa0;mg/m&#xb3;) represented a high concentration that may be life-threatening following exposure. In this study, it was observed that the distances of AEGL-3 were only present under higher temperatures and were relatively short. This suggested that elevated temperatures may facilitate rapid evaporation of benzene, yet may also facilitate its rapid diffusion and dilution, resulting in rapidly declining concentrations at a distance from the leakage source (<xref ref-type="bibr" rid="B69">Zhou et al., 2024</xref>).</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Effects of different factors on the variation of AEGLs distances. <bold>(A&#x2013;C)</bold>, <bold>(D&#x2013;F)</bold>, <bold>(G&#x2013;I)</bold>, and <bold>(J&#x2013;L)</bold> indicate the effects of different wind speed, temperature, leakage aperture, and atmospheric stabilities on the AEGL-1, AEGL-2, and AEGL-3 distances, respectively.</p>
</caption>
<graphic xlink:href="fenvs-12-1409072-g007.tif"/>
</fig>
<p>Wind speed significantly influenced the diffusion ranges of benzene, with wind speed increasing from 1&#xa0;m/s to 6&#xa0;m/s, the AEGL-1, AEGL-2, and AEGL-3 distances exhibiting different growth trends. The increase in diffusion distances was attributed to the turbulent mixing effect at higher wind speeds. However, the extent of this increase was limited, particularly as the AEGL-2 and AEGL-3 distances stabilized more quickly at higher wind speeds. The AEGL-3 distance initially rose with an increase in wind speed until it stabilized approximately 200&#xa0;s. The maximum distance of 73.93&#xa0;m was reached at a wind speed of 4&#xa0;m/s, after which it slightly decreased with further increases in wind speed. Before reaching a steady state in concentration distribution, wind speed primarily served as a mechanism for transporting the cloud over longer distances within the same time frame. Upon reaching a steady state, wind speed facilitated dilution in addition to transportation (<xref ref-type="bibr" rid="B67">Zhou et al., 2021</xref>). An increase in wind speed not only enhanced the dilution effect but also accelerated the diffusion speed, thereby narrowing the hazardous range. The impacts of leakage aperture and atmospheric stability on the hazardous distance were minimal. An incremental rise in the AEGL-1 distance was observed with the enlargement of leakage aperture, whereas the AEGL-2 and AEGL-3 distances exhibited negligible changes. Furthermore, the AEGL-1, AEGL-2, and AEGL-3 distances showed no significant variance under different atmospheric stabilities, indicating that over longer periods, atmospheric stability exerted minimal influence on diffusion distances.</p>
</sec>
</sec>
<sec id="s3-2">
<title>3.2 Correlation analysis</title>
<p>Pearson correlation analysis was employed to evaluate the linear relationship between the CFD-simulated methane concentration (C1) and various characteristic variables, including time, leakage aperture, wind speed, temperature, atmospheric stability, and downwind distance. The corresponding results are depicted in <xref ref-type="fig" rid="F8">Figure 8</xref>. Specifically, wind speed and downwind distance were negatively correlated with C1, with correlation coefficients of &#x2212;0.01 and &#x2212;0.48, indicating that an increase in wind speed and greater downwind distance resulted in reduced methane concentrations, respectively. Conversely, positive correlations were identified between C1 and variables including time, leakage aperture, temperature, and atmospheric stability, with coefficients of 0.16, 0.01, 0.20, and 0.02, respectively. The strong positive correlation between C1 and time and temperature indicated that higher concentrations were associated with longer leakage time and higher temperature. These findings reveal that there exists a significant but relatively weak correlation between C1 and the characteristic variables, and a nonlinear relationship among the characteristic variables. Given the complexity of the atmospheric diffusion mechanism, which involves nonlinear and dynamic processes affected by various factors, traditional linear models are not the optimal choice. Therefore, it is recommended that a nonlinear model be adopted for a more accurate representation of the complex variable interactions and effects. Furthermore, an analysis of the diffusion mechanism was conducted to robustly support the correlation between the variables, as detailed in the <xref ref-type="sec" rid="s10">Supplementary Text S2</xref>.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Correlation coefficients between characteristic variables and between characteristic variables and the target variable (C1), "&#xd7;" indicates that the correlation did not pass the significance test at the significance level &#x3b1; &#x3d; 0.05.</p>
</caption>
<graphic xlink:href="fenvs-12-1409072-g008.tif"/>
</fig>
</sec>
<sec id="s3-3">
<title>3.3 Feasibility analysis of ML algorithms using CFD standard data</title>
<sec id="s3-3-1">
<title>3.3.1 Model performance evaluation</title>
<p>To evaluate the performance of the five&#xa0;ML models on CFD standard data, various evaluation metrics were calculated, as depicted in <xref ref-type="fig" rid="F9">Figure 9</xref>. <xref ref-type="fig" rid="F9">Figure 9A</xref> reveals that R<sup>2</sup> for the training set among these models varied from 0.962 to 0.999, and IOA varied from 0.990 to 0.999. Notably, R<sup>2</sup> and IOA of the XGBoost and LightGBM models were both 0.999, indicating nearly-perfect prediction accuracy. In terms of RMSE, the XGBoost model outperformed other models with a score of 181.669&#xa0;mg/m&#xb3;, closely followed by the LightGBM model, which scored 204.089&#xa0;mg/m<sup>3</sup>. Additionally, these models also exhibited outstanding MAE, with the XGBoost model at 85.742&#xa0;mg/m&#xb3; and the LightGBM model at 108.414&#xa0;mg/m&#xb3;, underscoring the exceptional predictive performance of the XGBoost model.</p>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Performance evaluation of predictions based on MLP, RF, DT, XGBoost, and LightGBM models for standard <bold>(A)</bold> training data and <bold>(B)</bold> testing data.</p>
</caption>
<graphic xlink:href="fenvs-12-1409072-g009.tif"/>
</fig>
<p>On the testing set, both the XGBoost and LightGBM models exhibited strong correlations with R<sup>2</sup> of 0.996 and 0.993, and IOA of 0.999 and 0.998, respectively (<xref ref-type="fig" rid="F9">Figure 9B</xref>). In contrast, despite the MLP and RF models exhibiting high R<sup>2</sup> on the training set (0.962 and 0.964, respectively) and acceptable R<sup>2</sup> on the testing set (0.894 and 0.968), their higher RMSE and MAE suggested a significantly lower prediction accuracy compared to the XGBoost and LightGBM models. The DT model performed well on the training set, with RMSE of 1546.323&#xa0;mg/m<sup>3</sup>. Nonetheless, its accuracy decreased on the testing set, with RMSE and MAE of 1483.873&#xa0;mg/m<sup>3</sup> and 686.351&#xa0;mg/m<sup>3</sup>, respectively, and slightly lower R<sup>2</sup> and IOA. This analysis indicates that the MLP and DT models may not be optimal for low-dimensional sample data. However, ensemble models such as the XGBoost and LightGBM models can effectively mitigate the risks of overfitting by integrating multiple simple models, thereby ensuring improved accuracy of concentration prediction.</p>
<p>In the field of environmental science, numerous studies (<xref ref-type="bibr" rid="B25">Li J. et al., 2021</xref>; <xref ref-type="bibr" rid="B62">Zang et al., 2021</xref>; <xref ref-type="bibr" rid="B57">Xu et al., 2022</xref>) have employed a range of ML algorithms to construct prediction models for air pollutant concentrations, with R<sup>2</sup> primarily falling within the range of 0.68&#x2013;0.88. In comparison, our models demonstrated a significant improvement in prediction accuracy. Moreover, in the field of risk assessment of accident consequences, related studies (<xref ref-type="bibr" rid="B35">Ni et al., 2020</xref>; <xref ref-type="bibr" rid="B51">Wang et al., 2023</xref>) have demonstrated the performance of ML models based on CFD simulation data, where R<sup>2</sup> of the models was higher than 0.90. The ML models constructed on the basis of idealized CFD data in our study, in particular the XGBoost model, not only matched but even outperformed these performance ranges reported by these studies. These results demonstrated the effectiveness of the XGBoost model in terms of prediction accuracy, and illustrated the capacity of the model to process complex and high-dimensional data. The findings suggested the potential applicability of the model in the field of environmental sciences.</p>
</sec>
<sec id="s3-3-2">
<title>3.3.2 Effects of model predictions on concentration accuracy</title>
<p>To further assess the accuracy of various models in predicting concentrations, a validation analysis was performed under a stable atmosphere scenario, characterized by a 200&#xa0;mm leakage aperture, a wind speed of 6&#xa0;m/s, and a temperature of 50&#xb0;C. Concentrations at different distances were compared, with the results presented in <xref ref-type="fig" rid="F10">Figure 10</xref>. This figure demonstrates that the MLP model was unable to accurately predict concentration distributions and trends at both near and distant distances, leading to unsatisfactory outcomes. Conversely, the other models showed improved accuracy in capturing the concentration trends. Notably, from distances of 10&#xa0;m&#x2013;500&#xa0;m, the predictive curves of these models closely aligned with the actual concentration curves, demonstrating high consistency. At a distance of 50&#xa0;m, all models except the MLP model produced predictions nearly identical to the actual concentrations, with the predictive and actual curves almost overlapping, indicating their robust performance in near-distance prediction. However, the accuracy of these predictions decreased as the distance increased. Beyond 1,000&#xa0;m, the MLP, DT, and RF models exhibited considerable deviations and were unable to accurately capture the actual concentration distribution and trends, highlighting their limitations in distant-distance concentration prediction. In contrast, the predictive curves of the XGBoost and LightGBM models remained closely aligned with the actual curves, demonstrating their capacity to handle large-scale and complex data effectively. Nevertheless, <xref ref-type="fig" rid="F10">Figure 10C</xref> clearly shows some deviations between the predictive curve of the LightGBM model and the actual concentration curve during abrupt increases. Although the LightGBM model exhibited a slightly stable trend aligning with the actual values in high concentration ranges (<xref ref-type="fig" rid="F10">Figures 10A,B</xref>), the XGBoost model adapted more quickly to near-actual values in rapidly changing concentrations (<xref ref-type="fig" rid="F10">Figures 10E,H</xref>). This indicated that the XGBoost model may provide more timely decision support in dynamic prediction scenarios. Considering their performance with respect to prediction latency and accuracy in high concentration intervals, the XGBoost model outperformed the LightGBM model, corroborating the findings discussed in <xref ref-type="sec" rid="s3-3-1">Section 3.3.1</xref>. These results provide a scientific framework for model selection in particular scenarios.</p>
<fig id="F10" position="float">
<label>FIGURE 10</label>
<caption>
<p>Comparison of model validation for concentration at different downwind distances: <bold>(A)</bold>, <bold>(B)</bold>, <bold>(C)</bold>, <bold>(D)</bold>, <bold>(E)</bold>, <bold>(F)</bold>, <bold>(G)</bold>, and <bold>(H)</bold> correspond to the predicted <italic>versus</italic> the true values of the different models at downwind distances of 10, 50, 100, 500, 1,000, 1,500, 2000, and 2,500&#xa0;m, respectively.</p>
</caption>
<graphic xlink:href="fenvs-12-1409072-g010.tif"/>
</fig>
</sec>
</sec>
<sec id="s3-4">
<title>3.4 Evaluation of ML algorithms based on noisy data</title>
<sec id="s3-4-1">
<title>3.4.1 Model performance evaluation</title>
<p>In order to more closely match real-world measured data and to evaluate the generalizability of the model, noise is often introduced into the standard data to mimic real-world variations (<xref ref-type="bibr" rid="B28">Li X. et al., 2021</xref>). Therefore, Gaussian noise was incorporated into the CFD standard data and the mean and variance of the Gaussian noise were adjusted to generate datasets with different noise levels. The performance of each model on the training and testing data was evaluated with a noise scale of 0.5, and the results of this evaluation are depicted in <xref ref-type="fig" rid="F11">Figure 11</xref>.</p>
<fig id="F11" position="float">
<label>FIGURE 11</label>
<caption>
<p>Performance evaluation of predictions based on MLP, RF, DT, XGBoost, and LightGBM models for noisy <bold>(A)</bold> training data and <bold>(B)</bold> testing data.</p>
</caption>
<graphic xlink:href="fenvs-12-1409072-g011.tif"/>
</fig>
<p>
<xref ref-type="fig" rid="F11">Figure 11</xref> shows that the MLP model achieved RMSE and MAE of 3062.884&#xa0;mg/m<sup>3</sup> and 1430.555&#xa0;mg/m<sup>3</sup> on the training set, and 3078.269&#xa0;mg/m<sup>3</sup> and 1494.641&#xa0;mg/m<sup>3</sup> on the testing set, respectively. Although the DT and RF models performed slightly better in terms of RMSE and MAE, they still exhibited significant sensitivity to the presence of noise. In comparison, both the XGBoost and LightGBM models demonstrated exceptional performance across all evaluation metrics, with the lowest RMSE and MAE. RMSE for the XGBoost and LightGBM models on the training data were 1856.175&#xa0;mg/m<sup>3</sup> and 1831.244&#xa0;mg/m<sup>3</sup>, respectively, while MAE were 778.301&#xa0;mg/m<sup>3</sup> and 785.941&#xa0;mg/m<sup>3</sup>, respectively. R<sup>2</sup> was 0.973 for the XGBoost model and 0.974 for the LightGBM model, with both models achieving IOA of 0.993. The difference in performance between the two models was minimal, with the LightGBM model slightly outperforming in terms of predictive accuracy. On the testing data, RMSE for the XGBoost and LightGBM models were 2091.083&#xa0;mg/m<sup>3</sup> and 2162.072&#xa0;mg/m<sup>3</sup>, with MAE were 918.705&#xa0;mg/m<sup>3</sup> and 41.887&#xa0;mg/m<sup>3</sup>, respectively. R<sup>2</sup> was 0.963 and 0.961, and IOA was 0.991 and 0.990, respectively. Here, the performance of the XGBoost model was more pronounced. Overall, both models demonstrated high robustness in processing and predicting noisy data, which is vital for the effective operation of ML algorithms in diverse real-world situations. Nevertheless, the XGBoost model displayed an advantage in predictive accuracy and stability.</p>
<p>Previous studies (<xref ref-type="bibr" rid="B35">Ni et al., 2020</xref>; <xref ref-type="bibr" rid="B51">Wang et al., 2023</xref>) have typically constructed ML prediction models based on idealized data from CFD simulations. However, in real-world environments, real data frequently contain noise due to monitoring equipment failures and measurement errors. This study sought to assess the reliability of the predictive performance of ML models based on noisy data by adding noise to the data to reflect the real-world situation, and enhance the robustness and generalization of the models. The results demonstrated that the XGBoost model exhibited excellent predictive performance despite the presence of noise.</p>
</sec>
<sec id="s3-4-2">
<title>3.4.2 Effects of model predictions on concentration accuracy</title>
<p>A comparative analysis of concentration predictions at various distances from the source was performed using noisy data, with the results illustrated in <xref ref-type="fig" rid="F12">Figure 12</xref>. The analysis clearly indicated that as the downwind distance increases, the difference between the predictions of the models and the noise values also increased, indicating a higher level of uncertainty in the prediction. At near distances, the&#x2019; predictions of all models were closer to the actual values. However, at distant distances, the prediction curves become more volatile, with the MLP model&#x2019;s predictions deviating significantly from the true values. The MLP model was ineffective in predicting noisy data. The DT and RF models, while providing predictions closer to the true values, did not accurately reflect the overall trends. Conversely, the XGBoost and LightGBM models demonstrated exceptional predictive performance, accurately capturing changes in concentration trends at both near and distant distances. This evidence reinforces the notion that ensemble models, especially the XGBoost and LightGBM models, exhibit strong generalization capabilities and robustness in both standard and noisy data, excelling in predicting concentration distributions and trends effectively. Overall, the inherent features of ensemble models, such as model averaging, robustness, and overfitting prevention, contribute to their effectiveness in making reliable predictions within noisy environments (<xref ref-type="bibr" rid="B12">Cong et al., 2023</xref>). These attributes render ensemble models indispensable tools for addressing the complexity and uncertainty inherent in real-world data.</p>
<fig id="F12" position="float">
<label>FIGURE 12</label>
<caption>
<p>The comparison of model validation for concentrations at different downwind distances: <bold>(A)</bold>, <bold>(B)</bold>, <bold>(C)</bold>, <bold>(D)</bold>, <bold>(E)</bold>, <bold>(F)</bold>, <bold>(G)</bold>, <bold>(H)</bold> correspond to the predicted values <italic>versus</italic> the true values of the different models at downwind distances of 10, 50, 100, 500, 1,000, 1,500, 2000, 2,500&#xa0;m, respectively.</p>
</caption>
<graphic xlink:href="fenvs-12-1409072-g012.tif"/>
</fig>
</sec>
<sec id="s3-4-3">
<title>3.4.3 Analysis of predictive application using the XGBoost model</title>
<p>In emergency rescue operations, accurately predicting the temporal distribution of hazardous chemical concentration over time and the corresponding hazardous distances for concentration limits is essential for devising the effective emergency response strategies. This study evaluated the efficiency of the XGBoost model in predicting the diffusion of liquid benzene leakage following a leakage from a tank with a 200&#xa0;mm aperture under conditions of a 6&#xa0;m/s wind speed, a 50&#xb0;C temperature, and stable atmospheric conditions. The aim is to replicate an industrial scenario with specific environmental parameters. The comparison between CFD simulation results and hazardous distance predictions from the XGBoost model, as presented in <xref ref-type="fig" rid="F13">Figure 13</xref>, underscores the exceptional ability of the model in accurately predicting benzene concentration levels and determining hazardous distances. Specifically, the XGBoost model demonstrates the capacity to accurately predict concentrations at different distances, whether near the leakage source or at distant distances. Notably, <xref ref-type="fig" rid="F13">Figure 13A</xref> confirms the accuracy of the model in matching saturation concentrations, whereas <xref ref-type="fig" rid="F13">Figures 13B,C</xref> indicate a minor temporal delay in the model&#x2019;s predictions compared to the actual values, suggesting a negligible hysteresis effect without compromising overall accuracy. Moreover, the model demonstrated exceptional alignment with real-world distances for AEGL-1, AEGL-2, and AEGL-3, with minimal relative errors. Specifically, it predicted distances of 2705.1&#xa0;m, 378.4&#xa0;m, and 74.44&#xa0;m against the true distances of 2780.2&#xa0;m, 368.9&#xa0;m, and 74.27&#xa0;m, achieving relative errors of 2.70%, 2.58%, and 0.23%, respectively. Compared to the CFD model, the enhanced efficacy and speed exhibited by the XGBoost model indicate that ML algorithms may significantly improve the real-time emergency response capabilities, potentially reducing the risks these accidents pose to humans and the environment. In addition, the XGBoost model exhibited a markedly superior predictive efficiency compared to the CFD model, resulting in significant savings in computational costs. The model took only 0.218&#xa0;s to output the prediction results when running on a computer with an AMD Ralon R7 6800H CPU and 32G of RAM, while the CFD model took about 3&#xa0;h to complete a simulation on a computer with an 11th Gen Intel<sup>&#xae;</sup> Core (TM) i5-11400H CPU and 8G of RAM for this leakage scenario. It should be noted that the simulation time may vary depending on the specific leakage scenario under consideration. Obviously, using ML algorithms can significantly improve the prediction efficiency and meet the current demand for dynamic, accurate and fast predictions in smart parks.</p>
<fig id="F13" position="float">
<label>FIGURE 13</label>
<caption>
<p>Comparison of predicted and true values of concentrations at various downwind distances and hazardous distances based on the XGBoost model, <bold>(A)</bold>, <bold>(B)</bold>, and <bold>(C)</bold> correspond to downwind distances of 10, 100, and 1,000&#xa0;m, respectively. <bold>(D)</bold>, <bold>(E)</bold>, and <bold>(F)</bold> correspond to AEGL-1, AEGL-2, and AEGL-3 distances, respectively.</p>
</caption>
<graphic xlink:href="fenvs-12-1409072-g013.tif"/>
</fig>
<p>The precise prediction of hazardous distances is crucial for assessing the consequences of leakage accidents and for immediate emergency response measures. The investigation of XGBoost models that not only provide accurate predictions but also maintain prediction efficiency has enabled the fast provision of prediction ranges for emergency response. It is recommended that further development and integration of ML techniques for the prediction and management of hazardous situation be a priority in industrial safety and environmental protection strategies.</p>
</sec>
</sec>
</sec>
<sec sec-type="conclusion" id="s4">
<title>4 Conclusion</title>
<p>This study examined the consequences of chemical leakage accidents by simulating Burro series experiments using the CFD (PHOENICS version 6.0) model. The simulations were benchmarked against Burro nine data, revealing a strong correlation between the simulated and observed concentrations within acceptable discrepancies, thereby affirming the efficacy of the CFD model in simulating the heavy gas leakage diffusion. Using liquid benzene as an example, a CFD-based dynamic model was developed to analyze the consequences of heavy gas leakage diffusion, examining the impacts of wind speed, temperature, leakage aperture, and atmospheric stability. The analysis underscored the pivotal roles of wind speed and temperature in influencing the distribution patterns of liquid benzene concentrations and AEGLs distances over extended periods. In contrast, leakage aperture and atmospheric stability minimally affected the hazardous distances. Furthermore, five&#xa0;ML models were developed using CFD standard and noisy data. The performance assessment revealed that the XGBoost model surpassed the other models for concentration simulation, demonstrating resilience to noise interference. Consequently, a fast prediction model for the dynamic diffusion of heavy gas leakage based on the XGBoost model was established. This model&#x2019;s precision was confirmed by comparing actual and predicted concentrations at various downwind distances and hazardous distances. The relative errors between the actual values and predictions of AEGL-1, AEGL-2, and AEGL-3 distances were 2.70%, 2.58%, and 0.23%, respectively. More importantly, the XGBoost model demonstrated exceptional efficiency, generating predictions in only 0.218&#xa0;s, significantly faster than the CFD model. This efficiency, coupled with reduced computational demands, positioned ML algorithms as vital tools for dynamic and precise emergency response planning in smart parks, highlighting their potential in enhancing future response strategies.</p>
<p>However, it is essential to acknowledge the uncertainties and limitations inherent in our study. The reliance on data-driven models, particularly the opaque nature of ML algorithms, introduces uncertainties in understanding dynamic mechanisms. Additionally, despite utilizing CFD outputs augmented with Gaussian noise, it still differs from actual leakage scenarios. Furthermore, the applicability of our model is confined to open-space leakage incidents, omitting the influence of complex terrains and various underlying surface types on predictive accuracy. The efficacy of the XGBoost model in handling complex terrains or enclosed spaces necessitates further investigation. This opens up new avenues for our future research in this field. Future directions include incorporating real observational data, employing sophisticated data assimilation techniques for improved precision, and expanding the model to encompass a wider array of factors and scenarios.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="sec" rid="s10">Supplementary Material</xref>, further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>CF: Writing&#x2013;original draft, Writing&#x2013;review and editing. HG: Writing&#x2013;review and editing. YZ: Writing&#x2013;review and editing. WM: Writing&#x2013;review and editing. QY: Writing&#x2013;review and editing.</p>
</sec>
<sec sec-type="funding-information" id="s7">
<title>Funding</title>
<p>The author(s) declare that no financial support was received for the research, authorship, and/or publication of this article. The author(s) declare that no financial support was received for the research, authorship, and/or publication of this article.</p>
</sec>
<ack>
<p>We really appreciate the editors and reviewers for their meaningful comments for improving our manuscript.</p>
</ack>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fenvs.2024.1409072/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fenvs.2024.1409072/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet2.docx" id="SM1" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet1.XLSX" id="SM2" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ahmed</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Adnan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Janssens</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Wets</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A Route to School Informational Intervention for Air Pollution Exposure Reduction</article-title>. <source>Sustain. Cities Soc.</source> <volume>53</volume>, <fpage>101965</fpage>. <pub-id pub-id-type="doi">10.1016/j.scs.2019.101965</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Arsic</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mihajlovi&#x107;</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Nikoli&#x107;</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>&#x17d;ivkovi&#x107;</surname>
<given-names>&#x17d;.</given-names>
</name>
<name>
<surname>Pani&#x107;</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Prediction of Ozone Concentration in Ambient Air Using multilinear Regression and the Artificial Neural Networks Methods</article-title>. <source>Ozone Sci. Eng.</source> <volume>42</volume>, <fpage>79</fpage>&#x2013;<lpage>88</lpage>. <pub-id pub-id-type="doi">10.1080/01919512.2019.1598844</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Barjoee</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Elmi</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Varaoon</surname>
<given-names>V. T.</given-names>
</name>
<name>
<surname>Keykhosravi</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Karimi</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Hazards of Toluene Storage Tanks in a Petrochemical Plant: Modeling Effects, Consequence Analysis, and Comparison of Two Modeling Programs</article-title>. <source>Environ. Sci. Pollut. Res. Int.</source> <volume>29</volume>, <fpage>4587</fpage>&#x2013;<lpage>4615</lpage>. <pub-id pub-id-type="doi">10.1007/s11356-021-15864-5</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Random Forests</article-title>. <source>Mach. Learn.</source> <volume>45</volume>, <fpage>5</fpage>&#x2013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1023/a:1010933404324</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bruha</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>From Machine Learning to Knowledge Discovery: Survey of Preprocessing and Postprocessing</article-title>. <source>Intell. Data Anal.</source> <volume>4</volume>, <fpage>363</fpage>&#x2013;<lpage>374</lpage>. <pub-id pub-id-type="doi">10.3233/ida-2000-43-413</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bu</surname>
<given-names>F. X.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Guan</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Real scenario analysis of buried natural gas pipeline leakage based on soil-atmosphere coupling</article-title>. <source>Int. J. Press. Vessels Pip.</source> <volume>199</volume>, <fpage>104713</fpage>. <pub-id pub-id-type="doi">10.1016/j.ijpvp.2022.104713</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chai</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Xia</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Review of Machine Learning-based 5G for Industrial Internet of Things</article-title>. <source>Inf. Control</source> <volume>52</volume>, <fpage>257</fpage>&#x2013;<lpage>276</lpage>. <pub-id pub-id-type="doi">10.13976/j.cnki.xk.2023.2574</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Mu</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Comparative Analysis of Hourly PM_(2.5) Prediction Based on Multiple Machine Learning Models</article-title>. <source>J Nanjing For. Univ.</source> <volume>46</volume>, <fpage>152</fpage>&#x2013;<lpage>160</lpage>. <pub-id pub-id-type="doi">10.12302/j.issn.1000-2006.202106023</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Guestrin</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2016</year>). &#x201c;<article-title>XGBoost: A Scalable Tree Boosting System</article-title>,&#x201d; in <conf-name>Proceedings of the 22nd Acm Sigkdd International Conference on Knowledge Discovery and Data Mining</conf-name>. <publisher-loc>San Francisco, California, USA</publisher-loc>: <publisher-name>Association for Computing Machinery</publisher-name>, <fpage>785</fpage>&#x2013;<lpage>794</lpage>.</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cheng</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Xia</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Pang</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Simulation Study on Consequences of Ethylene Oxide Storage Tank Leakage Accidents in Summer and Winter</article-title>. <source>Saf. Environ. Eng.</source> <volume>29</volume>, <fpage>156</fpage>&#x2013;<lpage>162</lpage>. <pub-id pub-id-type="doi">10.13578/j.cnki.issn.1671-1556.20211463</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cong</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>The Integrated Forecasting Model of Stock Index Based on CEEMD-CNN-LSTM</article-title>. <source>Syst. Eng.</source> <volume>41</volume>, <fpage>104</fpage>&#x2013;<lpage>116</lpage>.</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ehteram</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Panahi</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ahmed</surname>
<given-names>A. N.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y. F.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Elshafie</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Predicting Evaporation with Optimized Artificial Neural Network Using Multi-Objective Salp Swarm Algorithm</article-title>. <source>Environ. Sci. Pollut. Res. Int.</source> <volume>29</volume>, <fpage>10675</fpage>&#x2013;<lpage>10701</lpage>. <pub-id pub-id-type="doi">10.1007/s11356-021-16301-3</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Duan</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>The Seasonal Differential Effects of Meteorological Parameters on Atmospheric Pollutants and the Prediction Model Comparison: A Case Study of Shenzhen</article-title>. <source>Environ. Pollut. Control</source> <volume>41</volume>, <fpage>541</fpage>&#x2013;<lpage>546</lpage>. <pub-id pub-id-type="doi">10.15985/j.cnki.1001-3865.2019.05.009</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fu</surname>
<given-names>L. I.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Bernoulli&#x2019;s Equation for Compressible Flow</article-title>. <source>Coll. Phys.</source> <volume>27</volume>, <fpage>15</fpage>. <pub-id pub-id-type="doi">10.3969/j.issn.1000-0712.2008.08.005</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fu</surname>
<given-names>W.-X.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>J. H.</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>X. N.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>F. J.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Elucidating the Impacts of Meteorology and Emission Changes on Concentrations of Major Air Pollutants in Major Cities in the Yangtze River Delta Region Using a Machine Learning De-weather Method</article-title>. <source>Environ. Sci.</source> <volume>44</volume>, <fpage>5879</fpage>&#x2013;<lpage>5888</lpage>. <pub-id pub-id-type="doi">10.13227/j.hjkx.202301119</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Galeev</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>Salin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ponikarov</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Consequence Analysis of Aqueous Ammonia Spill Using Computational Fluid Dynamics</article-title>. <source>J. Loss Prev. Process Ind.</source> <volume>26</volume>, <fpage>628</fpage>&#x2013;<lpage>638</lpage>. <pub-id pub-id-type="doi">10.1016/j.jlp.2012.12.006</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gao</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>F.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Air Quality Prediction Approach Based on Integrating Forecasting Dataset</article-title>. <source>J. Shandong Univ. Eng. Sci.</source> <volume>50</volume>, <fpage>91</fpage>&#x2013;<lpage>99</lpage>. <pub-id pub-id-type="doi">10.6040/j.issn.1672-3961.0.2019.404</pub-id>
</citation>
</ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gong</surname>
<given-names>H. X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y. Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>G. Y.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>Y. Q.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Kuang</surname>
<given-names>Z. X.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Quantifying the spatial representativeness of carbon flux footprints of a grassland ecosystem in the semi-arid region</article-title>. <source>J. Geophy. Res. Atmosph.</source> <volume>128</volume>. <pub-id pub-id-type="doi">10.1029/2022JD038269</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname>
<given-names>X. M.</given-names>
</name>
<name>
<surname>Su</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Numerical Study on Leakage Dispersion Pattern and Hazardous Area of Ammonia Storage Tanks</article-title>. <source>Energy Technol.</source> <volume>12</volume>, <fpage>2301067</fpage>. <pub-id pub-id-type="doi">10.1002/ente.202301067</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiao</surname>
<given-names>Z. R.</given-names>
</name>
<name>
<surname>Ji</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Deep Learning Based Quantitative Property-Consequence Relationship (QPCR) Models For Toxic Dispersion Prediction</article-title>. <source>Process Saf. Environ. Prot.</source> <volume>152</volume>, <fpage>352</fpage>&#x2013;<lpage>360</lpage>. <pub-id pub-id-type="doi">10.1016/j.psep.2021.06.019</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ji</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Construction of Intelligent Emergency Rescue Platform for Chemical Industry Park</article-title>. <source>Chem. Ind. Eng. Prog.</source> <volume>36</volume>, <fpage>1544</fpage>&#x2013;<lpage>1549</lpage>. <pub-id pub-id-type="doi">10.16085/j.issn.1000-6613.2017.04.051</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Zeng</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Yao</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Hourly PM2.5 Prediction and Its Comparative Analysis Under Multi-Machine Learning Model</article-title>. <source>China Environ. Sci.</source> <volume>40</volume>, <fpage>1895</fpage>&#x2013;<lpage>1905</lpage>. <pub-id pub-id-type="doi">10.3969/j.issn.1000-6923.2020.05.005</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Koopman</surname>
<given-names>R. P.</given-names>
</name>
<name>
<surname>Cederwall</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Ermak</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Goldwire</surname>
<given-names>H.</given-names>
<suffix>Jr.</suffix>
</name>
<name>
<surname>Hogan</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>McClure</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>1982</year>). <article-title>Analysis of Burro Series 40-m3 LNG Spill Experiments</article-title>. <source>J. Hazard. Mater.</source> <volume>6</volume>, <fpage>43</fpage>&#x2013;<lpage>83</lpage>. <pub-id pub-id-type="doi">10.1016/0304-3894(82)80034-4</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xiong</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Study on Impact of Leakage of Toxic and Hazardous Gases on Habitability of Main Control Room Based on ALOHA</article-title>. <source>Nucl. Power Eng.</source> <volume>40</volume>, <fpage>126</fpage>&#x2013;<lpage>130</lpage>. <pub-id pub-id-type="doi">10.13832/j.jnpe.2019.01.0126</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2021a</year>). <article-title>Optimization of Numerical Simulation in Xi&#x2019;an Based on Machine Learning Methods</article-title>. <source>Res. Environ. Sci.</source> <volume>34</volume>, <fpage>872</fpage>&#x2013;<lpage>881</lpage>.</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Characteristics of Surface Layer Wind Speed Profiles over Different Underlying Surfaces</article-title>. <source>Resour. Sci.</source> <volume>33</volume>, <fpage>2005</fpage>&#x2013;<lpage>2010</lpage>.</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Shan</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Intelligent Approach for Analyzing Surveillance Videos in Urban Emergency Management</article-title>. <source>Comput. Eng. Appl.</source> <volume>53</volume>, <fpage>154</fpage>&#x2013;<lpage>160</lpage>. <pub-id pub-id-type="doi">10.3778/j.issn.1002-8331.1606-0382</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2021b</year>). <article-title>Soft Prediction of Coal-mine Gas Concentration through the Mixture of Gaussian Processes Under the Noisy Input Prediction Strategy</article-title>. <source>J. Signal. P</source> <volume>37</volume>, <fpage>2031</fpage>&#x2013;<lpage>2040</lpage>. <pub-id pub-id-type="doi">10.16798/j.issn.1003-0530.2021.11.003</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Ou</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2021c</year>). <article-title>A Comparative Study on Edictive Effect of PM2.5 in Beijing Based on Tree Models</article-title>. <source>Environ. Eng.</source> <volume>39</volume>, <fpage>106</fpage>&#x2013;<lpage>113</lpage>. <pub-id pub-id-type="doi">10.13205/j.hjgc.202106016</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Substances of Very High Concern: Challenge to Risk Management System, Capability and Fundamental Research of Chemicals in China</article-title>. <source>Chin. Sci. Bull.</source> <volume>58</volume>, <fpage>2643</fpage>&#x2013;<lpage>2650</lpage>. <pub-id pub-id-type="doi">10.1360/972013-231</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Ouyang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>A Quantitative Noise Method to Evaluate Machine Learning Algorithm on Multi-Fidelity Data</article-title>. <source>J. Chin. Ceram. Soc.</source> <volume>51</volume>, <fpage>405</fpage>&#x2013;<lpage>410</lpage>. <pub-id pub-id-type="doi">10.14062/j.issn.0454-5648.20220811</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>Y. C.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Numerical Simulation Analysis of Fire Hazard from Leakage and Diffusion of Vinyl Chloride in Different Atmospheric Environments</article-title>. <source>Fire-Basel</source> <volume>5</volume>, <fpage>36</fpage>. <pub-id pub-id-type="doi">10.3390/fire5020036</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lu</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Adjusting PM_(2.5) Prediction of the Numerical Air Quality Forecast Model Based on Machine Learning Methods in Chengyu Region</article-title>. <source>Acta Sci. Circumstantiae</source> <volume>40</volume>, <fpage>4419</fpage>&#x2013;<lpage>4431</lpage>. <pub-id pub-id-type="doi">10.13671/j.hjkxxb.2020.0317</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ma</surname>
<given-names>Z. W.</given-names>
</name>
<name>
<surname>Dey</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Christopher</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Bi</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Balyan</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>A Review of Statistical Methods Used for Developing Large-Scale and Long-Term PM2.5 Models from Satellite Data</article-title>. <source>Remote Sens. Environ.</source> <volume>269</volume>, <fpage>112827</fpage>. <pub-id pub-id-type="doi">10.1016/j.rse.2021.112827</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ni</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Yao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Toxic Gas Dispersion Prediction For Point Source Emission Using Deep Learning Method</article-title>. <source>Hum. Ecol. Risk Assess.</source> <volume>26</volume>, <fpage>557</fpage>&#x2013;<lpage>570</lpage>. <pub-id pub-id-type="doi">10.1080/10807039.2018.1526632</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nielsen</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Olsen</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Fredenslund</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Prediction of Isothermal Evaporation Rates of Pure Volatile Organic-Compounds in Occupational Environments-A Theoretical Approach Based on Laminar Bouundary-Layer Theory</article-title>. <source>Ann. Occup. Hyg.</source> <volume>39</volume>, <fpage>497</fpage>&#x2013;<lpage>511</lpage>. <pub-id pub-id-type="doi">10.1016/0003-4878(95)00032-a</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Real-Time Environment Risk Analysis for Accident Release of Hazardous Materials Around Tank Area</article-title>. <source>Acta Sci. Circumstantiae</source> <volume>24</volume>, <fpage>539</fpage>&#x2013;<lpage>544</lpage>. <pub-id pub-id-type="doi">10.3321/j.issn:0253-2468.2004.03.030</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peng</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Peng</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>A PM (2.5) Prediction Model Based on Deep Learning and Random Forest</article-title>. <source>Natl. Remote Sens. Bull.</source> <volume>27</volume>, <fpage>430</fpage>&#x2013;<lpage>440</lpage>. <pub-id pub-id-type="doi">10.11834/jrs.20210504</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qiu</surname>
<given-names>S. H.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Qiu</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Estimating Contaminant Source in Chemical Industry Park Using UAV-Based Monitoring Platform, Artificial Neural Network and Atmospheric Dispersion Simulation</article-title>. <source>Rsc Adv.</source> <volume>7</volume>, <fpage>39726</fpage>&#x2013;<lpage>39738</lpage>. <pub-id pub-id-type="doi">10.1039/c7ra05637k</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qiu</surname>
<given-names>S. H.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Qiu</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Atmospheric Dispersion Prediction and Source Estimation of Hazardous Gas Using Artificial Neural Network, Particle Swarm Optimization and Expectation Maximization</article-title>. <source>Atmos. Environ.</source> <volume>178</volume>, <fpage>158</fpage>&#x2013;<lpage>163</lpage>. <pub-id pub-id-type="doi">10.1016/j.atmosenv.2018.01.056</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shaik</surname>
<given-names>N. B.</given-names>
</name>
<name>
<surname>Benjapolakul</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Pedapati</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Bingi</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Thien Le</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Asdornwised</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Recurrent Neural Network-Based Model for Estimating the Life Condition of a Dry Gas Pipeline</article-title>. <source>Process Saf. Environ. Prot.</source> <volume>164</volume>, <fpage>639</fpage>&#x2013;<lpage>650</lpage>. <pub-id pub-id-type="doi">10.1016/j.psep.2022.06.047</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Shaik</surname>
<given-names>N. B.</given-names>
</name>
<name>
<surname>Pedapati</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Othman</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Dzubir</surname>
<given-names>F. A. B. A.</given-names>
</name>
</person-group> (<year>2023</year>). &#x201c;<article-title>A Case Study to Predict Structural Health of a Gasoline Pipeline Using ANN and GPR Approaches</article-title>,&#x201d; in <source>ICPER 2020</source>. <publisher-loc>Singapore</publisher-loc>: <publisher-name>Springer Nature Singapore</publisher-name>, <fpage>611</fpage>&#x2013;<lpage>624</lpage>.</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shaik</surname>
<given-names>N. B.</given-names>
</name>
<name>
<surname>Jongkittinarukorn</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Benjapolakul</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Bingi</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>A Novel Neural Network-Based Framework to Estimate Oil and Gas Pipelines Life with Missing Input Parameters</article-title>. <source>Sci. Rep.</source> <volume>14</volume>, <fpage>4511</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-024-54964-3</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>So</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Koo</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Shin</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Yoon</surname>
<given-names>E. S.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>The Estimation of Hazardous Gas Release Rate Using Optical Sensor and Neural Network</article-title>. <source>20th Eur. Symposium Comput. Aided Process Eng.</source> <volume>28</volume>, <fpage>199</fpage>&#x2013;<lpage>204</lpage>. <pub-id pub-id-type="doi">10.1016/s1570-7946(10)28034-3</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Safety Exclusive Distance of LNG Dense Gas Dispersion and Its Influencing Factors</article-title>. <source>Nat. Gas. Ind.</source> <volume>30</volume>, <fpage>110</fpage>&#x2013;<lpage>113</lpage>. <pub-id pub-id-type="doi">10.3787/j.issn.1000-0976.2010.07.029</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Utikar</surname>
<given-names>R. P.</given-names>
</name>
<name>
<surname>Pareek</surname>
<given-names>V. K.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Computational Fluid Dynamics Analysis of Liquefied Natural Gas Dispersion for Risk Assessment Strategies</article-title>. <source>J. Loss Prev. Process Ind.</source> <volume>26</volume>, <fpage>117</fpage>&#x2013;<lpage>128</lpage>. <pub-id pub-id-type="doi">10.1016/j.jlp.2012.10.002</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Terzioglu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Iskender</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Modeling the Consequences of Gas Leakage and Explosion Fire in Liquefied Petroleum Gas Storage Tank in Istanbul Technical University, Maslak Campus</article-title>. <source>Process Saf. Prog.</source> <volume>40</volume>, <fpage>319</fpage>&#x2013;<lpage>326</lpage>. <pub-id pub-id-type="doi">10.1002/prs.12263</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>The Real-Time Estimation of Hazardous Gas Dispersion by the Integration of Gas Detectors, Neural Network and Gas Dispersion Models</article-title>. <source>J. Hazard. Mater.</source> <volume>300</volume>, <fpage>433</fpage>&#x2013;<lpage>442</lpage>. <pub-id pub-id-type="doi">10.1016/j.jhazmat.2015.07.028</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Qian</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Wind Field Reconstruction for the Dispersion Modeling of Accidental Chemical Spills on Complex Geometry</article-title>. <source>Chin. J. Chem. Eng.</source> <volume>27</volume>, <fpage>2712</fpage>&#x2013;<lpage>2724</lpage>. <pub-id pub-id-type="doi">10.1016/j.cjche.2019.02.029</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Research On XGBoost Prediction Method for Emergency Rescue Area of Liquid Ammonia Leakage</article-title>. <source>J. Saf. Environ.</source> <volume>23</volume>, <fpage>1482</fpage>&#x2013;<lpage>1489</lpage>. <pub-id pub-id-type="doi">10.13637/j.issn.1009-6094.2022.2546</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Kang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Intelligent Park Power System Management Platform Based on Big Data</article-title>. <source>Chin. J. Power Sources</source> <volume>41</volume>, <fpage>1637</fpage>&#x2013;<lpage>1639</lpage>. <pub-id pub-id-type="doi">10.3969/j.issn.1002-087X.2017.11.041</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Air Pollution Impact Prediction of Chemical Industry Park Based on Ensemble Learning Strategy</article-title>. <source>Oper. Res. Manage. Sci.</source> <volume>30</volume>, <fpage>127</fpage>&#x2013;<lpage>134</lpage>. <pub-id pub-id-type="doi">10.12005/orms.2021.0360</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wei</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Pinker</surname>
<given-names>R. T.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Xue</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Himawari-8-Derived Diurnal Variations in Ground-Level PM2.5 Pollution Across China Using The Fast Space-Time Light Gradient Boosting Machine (LightGBM)</article-title>. <source>Atmos. Chem. Phys.</source> <volume>21</volume>, <fpage>7863</fpage>&#x2013;<lpage>7880</lpage>. <pub-id pub-id-type="doi">10.5194/acp-21-7863-2021</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>A Missing Values Filling Algorithm Based on Random Forest for Non-Linear Noisy Datasets</article-title>. <source>Comput. Appl. Softw.</source> <volume>30</volume>, <fpage>51</fpage>&#x2013;<lpage>53</lpage>. <pub-id pub-id-type="doi">10.3969/j.issn.1000-386x.2013.07.015</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>L. W.</given-names>
</name>
<name>
<surname>Qiao</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Jar</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Investigation on Natural Gas Leakage and Diffusion Characteristics Based on CFD</article-title>. <source>Gas. Sci. Eng.</source> <volume>123</volume>, <fpage>205238</fpage>. <pub-id pub-id-type="doi">10.1016/j.jgsce.2024.205238</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Man</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Simulation of Daily PM_(2.5) Based on MODIS Data and Multi-Machine Learning Method</article-title>. <source>China Environ. Sci.</source> <volume>42</volume>, <fpage>2523</fpage>&#x2013;<lpage>2529</lpage>. <pub-id pub-id-type="doi">10.3969/j.issn.1000-6923.2022.06.005</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Qu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bi</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Numerical Simulation of Heavy Gas Dispersion</article-title>. <source>Cryogenics</source>, <fpage>45</fpage>&#x2013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.3969/j.issn.1000-6516.2018.03.010</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Application of Random Forests and Decision Trees in the Prognosis of Upper Gastrointestinal Bleeding in Patients with Liver Cirrhosis</article-title>. <source>Chin. J. Health Stat.</source> <volume>36</volume>, <fpage>162</fpage>&#x2013;<lpage>166</lpage>.</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Pu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Numerical Study on the Influence of Environmental Factors on the Diffusion Process of Liquid Oxygen Leakage</article-title>. <source>J. Xi&#x2019;an Jiaot. Univ.</source> <volume>55</volume>, <fpage>119</fpage>&#x2013;<lpage>129</lpage>. <pub-id pub-id-type="doi">10.7652/xjtuxb202108015</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zuo</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Tree-Based Ensemble Deep Learning Model for Spatiotemporal Surface Ozone (O3) Prediction and Interpretation</article-title>. <source>Int. J. Appl. Earth Obs.</source> <volume>103</volume>, <fpage>102516</fpage>. <pub-id pub-id-type="doi">10.1016/j.jag.2021.102516</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>A. N.</given-names>
</name>
<name>
<surname>Lijun</surname>
<given-names>W. E. I.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Review on Atmospheric Dispersion Response to Chemical Models for Emergency Accidents</article-title>. <source>China Saf. Sci. J.</source> <volume>17</volume>, <fpage>12</fpage>&#x2013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.3969/j.issn.1003-3033.2007.06.002</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Qiu</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Q.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Trend Analysis and Forecast of PM2.5 in Fuzhou, China Using the ARIMA Model</article-title>. <source>Ecol. Indic.</source> <volume>95</volume>, <fpage>702</fpage>&#x2013;<lpage>710</lpage>. <pub-id pub-id-type="doi">10.1016/j.ecolind.2018.08.032</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>X. B.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Qiu</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Computational Fluid Dynamics Study on Liquefied Natural Gas Dispersion with Phase Change of Water</article-title>. <source>Int. J. Heat. Mass Tran.</source> <volume>91</volume>, <fpage>347</fpage>&#x2013;<lpage>354</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijheatmasstransfer.2015.07.117</pub-id>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Study on Method of Regional Risk Assessment for Urban Major Hazard</article-title>. <source>J. Saf. Sci. Technol.</source> <volume>10</volume>, <fpage>158</fpage>&#x2013;<lpage>164</lpage>. <pub-id pub-id-type="doi">10.11731/j.issn.1673-193x.2014.09.027</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Numerical Simulation of the Effect of Wind Speed on LNG Leakage and the Diffusion Process</article-title>. <source>J. Saf. Environ.</source> <volume>21</volume>, <fpage>285</fpage>&#x2013;<lpage>294</lpage>. <pub-id pub-id-type="doi">10.13637/j.issn.1009-6094.2019.0909</pub-id>
</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Research Advances of Heavy Gas Dispersion</article-title>. <source>J. Saf. Environ.</source> <volume>12</volume>, <fpage>242</fpage>&#x2013;<lpage>247</lpage>. <pub-id pub-id-type="doi">10.3969/j.issn.1009-6094.2012.03.057</pub-id>
</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>Z. Q.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Bai</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>The Effects of Ambient Temperature and Atmospheric Humidity on the Diffusion Dynamics of Hydrogen Fluoride Gas Leakage Based on the Computational Fluid Dynamics Method</article-title>. <source>Toxics</source> <volume>12</volume>, <fpage>184</fpage>. <pub-id pub-id-type="doi">10.3390/toxics12030184</pub-id>
</citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Research on Influencing Factors in the Process of Gas Leakage and Dispersion</article-title>. <source>Chem. Eng. Oil Gas.</source> <volume>38</volume>, <fpage>354</fpage>&#x2013;<lpage>358</lpage>. <pub-id pub-id-type="doi">10.3969/j.issn.1007-3426.2009.04.024</pub-id>
</citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname>
<given-names>J. Y.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>Y. Z.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y. X.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J. X.</given-names>
</name>
</person-group> (<year>2023a</year>). <article-title>Atmospheric Ozone Concentration Prediction in Nanjing Based on LightGBM</article-title>. <source>Environ. Sci.</source> <volume>44</volume>, <fpage>3685</fpage>&#x2013;<lpage>3694</lpage>. <pub-id pub-id-type="doi">10.13227/j.hjkx.202208095</pub-id>
</citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Mu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2023b</year>). <article-title>Research on the Data-Driven Model for Estimating the Near-Surface PM_(2.5) Concentration in Anhui Province Using FY-4A Remote Sensing Data</article-title>. <source>Acta Sci. Circumstantiae</source> <volume>43</volume>, <fpage>196</fpage>&#x2013;<lpage>205</lpage>. <pub-id pub-id-type="doi">10.13671/j.hjkxxb.2023.0169</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>