<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Environ. Sci.</journal-id>
<journal-title>Frontiers in Environmental Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Environ. Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-665X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">887446</article-id>
<article-id pub-id-type="doi">10.3389/fenvs.2022.887446</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Environmental Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Prediction of River Pollution Under the Rainfall-Runoff Impact by Artificial Neural Network: A Case Study of Shiyan River, Shenzhen, China</article-title>
<alt-title alt-title-type="left-running-head">Tian et al.</alt-title>
<alt-title alt-title-type="right-running-head">Prediction of Rainfall-Runoff Pollution</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Tian</surname>
<given-names>Zhan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/951632/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yu</surname>
<given-names>Ziwei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Yifan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1492828/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ke</surname>
<given-names>Qian</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Liu</surname>
<given-names>Junguo</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1617126/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Luo</surname>
<given-names>Hongyan</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tang</surname>
<given-names>Yingdong</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>School of Environmental Science and Engineering</institution>, <institution>Southern University of Science and Technology</institution>, <addr-line>Shenzhen</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Pengcheng Laboratory</institution>, <addr-line>Shenzhen</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Delft University of Technology</institution>, <addr-line>Delft</addr-line>, <country>Netherlands</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Meteorological Bureau of Shenzhen Municipality</institution>, <addr-line>Shenzhen</addr-line>, <country>China</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>PowerChina Huadong Engineering Corporation Limited</institution>, <addr-line>Hangzhou</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1515255/overview">Mohamed Hasnain Isa</ext-link>, University of Technology Brunei, Brunei</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/969644/overview">An Liu</ext-link>, Shenzhen University, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1210559/overview">Chandra Ojha</ext-link>, Indian Institute of Technology Roorkee, India</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Junguo Liu, <email>junguo.liu@gmail.com</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Water and Wastewater Management, a section of the journal Frontiers in Environmental Science</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>22</day>
<month>06</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>10</volume>
<elocation-id>887446</elocation-id>
<history>
<date date-type="received">
<day>01</day>
<month>03</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>20</day>
<month>05</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Tian, Yu, Li, Ke, Liu, Luo and Tang.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Tian, Yu, Li, Ke, Liu, Luo and Tang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Climate change and rapid urbanization have made it difficult to predict the risk of pollution in cities under different types of rainfall. In this study, a data-driven approach to quantify the effects of rainfall characteristics on river pollution was proposed and applied in a case study of Shiyan River, Shenzhen, China. The results indicate that the most important factor affecting river pollution is the dry period followed by average rainfall intensity, maximum rainfall in 10&#xa0;min, total amount of rainfall, and initial runoff intensity. In addition, an artificial neural network model was developed to predict the event mean concentration (EMC) of COD in the river based on the correlations between rainfall characteristics and EMC. Compared to under light rain (&#x3c; 10&#xa0;mm/day), the predicted EMC was five times lower under heavy rain (25&#x2013;49.9&#xa0;mm/day) and two times lower under moderate rain (10&#x2013;24.9&#xa0;mm/day). By converting the EMC to chemical oxygen demand in the river, the pollution load under non-point-source runoff was estimated to be 497.6&#xa0;t/year (with an accuracy of 95.98%) in Shiyan River under typical rainfall characteristics. The results of this study can be used to guide urban rainwater utilization and engineering design in Shenzhen. The findings also provide insights for predicting the risk of rainfall-runoff pollution and developing related policies in other cities.</p>
</abstract>
<kwd-group>
<kwd>rainfall-runoff pollution</kwd>
<kwd>rainfall characteristics</kwd>
<kwd>EMC</kwd>
<kwd>integrated learning methods</kwd>
<kwd>ANN</kwd>
</kwd-group>
<contract-sponsor id="cn001">Science, Technology and Innovation Commission of Shenzhen Municipality<named-content content-type="fundref-id">10.13039/501100010877</named-content>
</contract-sponsor>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Rapid urbanization has adverse effects on the natural environment, especially in aquatic environments. Due to changes in the hydrological cycle and the high diversity of pollutants, urban rainfall-runoff pollution has become a major problem (<xref ref-type="bibr" rid="B20">Kammen and Sunter, 2016</xref>). Especially in the initial stage of rainfall, the river pollutant content is the highest in the entire runoff process, which is referred to as the first flush effect (<xref ref-type="bibr" rid="B12">Gnecco et al., 2005</xref>; <xref ref-type="bibr" rid="B9">Feng et al., 2017</xref>). Common river contaminants mainly include suspended solids, nutrients, and heavy metals, which have major effects on the water quality of urban rivers (<xref ref-type="bibr" rid="B30">Perera et al., 2019</xref>; <xref ref-type="bibr" rid="B40">Yang et al., 2021</xref>).</p>
<p>Rapid urbanization has increased the impervious areas in cities, thereby reducing rainwater infiltration and increasing the total amount of runoff into urban rivers and the pollution load of urban surface runoff (<xref ref-type="bibr" rid="B6">Chen et al., 2017</xref>; <xref ref-type="bibr" rid="B14">He et al., 2018</xref>). <xref ref-type="bibr" rid="B24">Li et al. (2021)</xref> found that human activity has contributed to long-term reductions in the total amount and frequency of weak precipitation and the significant increases in the total amount and frequency of heavy precipitation in China. Human activities such as land use and land cover change, the construction of dams and irrigation canals, and mining have altered urban river runoff (<xref ref-type="bibr" rid="B1">Adeyeri et al., 2020</xref>) and significantly affected the rainfall characteristics. Urban rainfall-runoff pollution has become the main cause of global urban water pollution (<xref ref-type="bibr" rid="B38">Wang et al., 2021</xref>). Thus, identifying the factors affecting this type of pollution is critically important for controlling urban river pollution.</p>
<p>To make timely predictions related to rainfall-runoff pollution with minimal data, researchers have begun to apply machine learning methods. These methods do not require a comprehensive understanding of the mechanism underlying the interactions between various parameters. These methods are also effective for simulating nonlinear and non-stationary hydrological environmental processes (<xref ref-type="bibr" rid="B34">Wang and Yao, 2013</xref>; <xref ref-type="bibr" rid="B3">Badrzadeh et al., 2015</xref>). Machine learning-based methods have shown advantages for the analysis of rainfall-runoff pollution, and with the development of data science, various machine learning methods have been explored and developed to predict rainfall-runoff pollution in urban rivers (<xref ref-type="bibr" rid="B18">Jeung et al., 2019</xref>). These methods include random forest (RF), gradient boosting decision tree (GBDT), and extreme gradient boosting (XGBoost) methods, which have been applied to analyze the relationships between rainfall characteristics and runoff pollution (<xref ref-type="bibr" rid="B39">Wu et al., 2014</xref>; <xref ref-type="bibr" rid="B37">Wang et al., 2015</xref>). RF algorithms have been used to rank the importance of multiple rainfall characteristics affecting the initial scouring effect of river runoff, revealing the following six most important characteristics: total rainfall amount; maximum rainfall intensity in 5&#xa0;min; rainfall duration; total amount of runoff; peak runoff; and average rainfall intensity (<xref ref-type="bibr" rid="B2">Alias et al., 2014</xref>; <xref ref-type="bibr" rid="B30">Perera et al., 2019</xref>). By using the boosting method, GBDT integrates multiple decision trees (DT) for analysis and has shown good prediction performance (<xref ref-type="bibr" rid="B26">Liang et al., 2020</xref>). <xref ref-type="bibr" rid="B16">Huan et al. (2020)</xref> applied a GBDT method to select characteristic factors with strong effects on dissolved oxygen and used these factors as input data to reduce the time needed for calculations. <xref ref-type="bibr" rid="B19">Joslyn (2018)</xref> evaluated the performance of XGBoost in predicting nine water quality factors (each factor was separately predicted using the other eight factors) and obtained success rates ranging from 80% to 90%.</p>
<p>Rainfall characteristics can also significantly affect the concentrations of river pollutants (<xref ref-type="bibr" rid="B8">Feng et al., 2015</xref>; <xref ref-type="bibr" rid="B43">Zhang et al., 2021</xref>), and rainfall duration and rainfall intensity are two of the most important factors affecting hydrological processes (<xref ref-type="bibr" rid="B32">Ran et al., 2012</xref>). Rainfall-runoff pollution is also affected by other rainfall characteristics such as the total amount of rainfall, which can affect the scouring effect of runoff (<xref ref-type="bibr" rid="B27">Liu et al., 2014</xref>), and the dry period (<xref ref-type="bibr" rid="B44">Zhang, 2011</xref>; <xref ref-type="bibr" rid="B29">Pang et al., 2012</xref>). <xref ref-type="bibr" rid="B18">Jeung et al. (2019)</xref> assessed the effects of rainfall characteristics on water quality parameters in urban rivers and found that different water quality parameters were affected by different rainfall characteristics; for example, biochemical oxygen demand and chemical oxygen demand (COD) were closely related to rainfall intensity, whereas total organic carbon and total phosphorus were strongly affected by the dry period. <xref ref-type="bibr" rid="B12">Gnecco et al. (2005)</xref> analyzed the event mean concentrations (EMCs) of various pollutants in urban rivers and found a strong correlation between maximum rainfall intensity and EMC.</p>
<p>Although several previous studies have analyzed rainfall characteristics and their qualitative effects on rainfall-runoff pollution, few studies have quantitatively analyzed the effects of rainfall characteristics on its pollution. Neural network models including artificial neural network (ANN), convolutional neural network, and back-propagation neural network models can consider multiple rainfall features together to predict rainfall-runoff pollution (<xref ref-type="bibr" rid="B39">Wu et al., 2014</xref>; <xref ref-type="bibr" rid="B37">Wang et al., 2015</xref>; <xref ref-type="bibr" rid="B5">Chau, 2017</xref>; <xref ref-type="bibr" rid="B11">Fotovatikhah et al., 2018</xref>). Some researchers have used neural network models to generalize the complex relationships between rainfall characteristics and water quality parameters to enhance the accuracy of rainfall-runoff simulation and prediction (<xref ref-type="bibr" rid="B10">Fernandes et al., 2020</xref>). For example, ANN models can be used to accurately determine whether the surface water quality meets the criteria set by national regulations or quantify the characteristics of water bodies (<xref ref-type="bibr" rid="B28">Palani et al., 2008</xref>; <xref ref-type="bibr" rid="B33">Shi et al., 2018</xref>). Using rainfall characteristics such as rainfall duration and confluence area as inputs and EMC as a training target, a back-propagation neural network model showed high accuracy for evaluating the total amount of pollutants in rainwater runoff (<xref ref-type="bibr" rid="B35">Tian, 2016</xref>). <xref ref-type="bibr" rid="B42">Ye et al. (2020)</xref> summarized the characteristics of neural network models used in environmental pollution research and found that ANN models can significantly improve the efficiency of pollutant prediction in rivers.</p>
<p>The objectives of this study were to analyze the CODs of Shiyan River and Shiyan Reservoir and explore the relationships between COD and rainfall characteristics. To achieve these objectives, we: 1) ranked the importance of different rainfall characteristics in terms of their effects on rainfall-runoff pollution using various integrated learning methods; 2) quantified the relationships between rainfall characteristics and runoff pollution in Shiyan River using an ANN model; and 3) estimated the non-point-source pollution load based on the typical EMC in the Shiyan River. As verified in this paper, the data-driven method presented herein can quickly predict the COD of the river. The findings provide a reference for water quality analysis in other fields.</p>
</sec>
<sec id="s2">
<title>2 Data and Methods</title>
<sec id="s2-1">
<title>2.1 Study Area</title>
<p>Over the past 40&#xa0;years, precipitation and extreme precipitation in the western urban area of Shenzhen have increased. Changes in the underlying surface and rainfall characteristics have also affected the temporal and spatial distributions of non-point-source pollution. In this study, Shiyan River in Shenzhen, China is taken as a research case, as can be seen in <xref ref-type="fig" rid="F1">Figure 1</xref>. Shiyan River is located in Shiyan Street, Bao&#x2019;an District and is a first-level tributary in the Maozhou River Basin. The total length of Shiyan River is 10.44&#xa0;km, and the catchment area of the basin is 27.05&#xa0;km<sup>2</sup>. The Shiyan River eventually merges into the Shiyan Reservoir, which is one of the four major reservoirs in Shenzhen and one of the largest sources of drinking water in Bao&#x2019;an District. With the rapid economic development of Bao&#x2019;an District, Shiyan River and Shiyan Reservoir will play increasingly important roles in water supply.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Map of Shiyan River, Shenzhen, China.</p>
</caption>
<graphic xlink:href="fenvs-10-887446-g001.tif"/>
</fig>
</sec>
<sec id="s2-2">
<title>2.2 Data</title>
<p>The following data were used in this study. First, the hourly/daily/annual river discharge (m<sup>3</sup>/s) and COD data (mg/L) for Shiyan River from 2009 to 2012 were obtained from <xref ref-type="bibr" rid="B31">Qin et al. (2013)</xref>. We also used data from <xref ref-type="bibr" rid="B31">Qin et al. (2013)</xref> to select the most influential rainfall characteristics for EMC and build the ANN model based on rainfall characteristics to predict the EMC value. Rainfall-runoff data (mm/min) for 2013&#x2013;2018 were obtained from <xref ref-type="bibr" rid="B25">Li (2020)</xref>.</p>
<p>Due to the uncertainty of rainfall events, there are currently no uniform and clear criteria for classifying rainfall events. Based on recent research considering the effects of rainfall confluence time and rainfall duration, 180&#xa0;min was used as the minimum time interval between two rainfall events, and the cumulative rainfall of each event had to be greater than 3&#xa0;mm (<xref ref-type="bibr" rid="B17">Huang et al., 2021</xref>). According to the amount of rainfall in 24&#xa0;h, all rainfall events were divided into six categories: light rain (&#x3c; 10&#xa0;mm); moderate rain (10&#x2013;24.9&#xa0;mm); heavy rain (25&#x2013;49.9&#xa0;mm); torrential rain (50&#x2013;99.9&#xa0;mm); rainstorm (100&#x2013;249.9&#xa0;mm); and extraordinary rainstorm (&#x2265; 250&#xa0;mm). Based on the above definitions of rainfall event and rainfall type, we obtained the typical rainfall characteristics (total amount of rainfall, rainfall duration, maximum rainfall per minute, maximum rainfall in 10&#xa0;min, rainfall intensity, and dry period) for the study area and used them in the subsequent verification of the pollution load of Shiyan River (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Typical rainfall characteristics under different rainfall types (2013&#x2013;2018) (<xref ref-type="bibr" rid="B25">Li, 2020</xref>).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Rainfall characteristics</th>
<th align="center">Light rain</th>
<th align="center">Moderate rain</th>
<th align="center">Heavy rain</th>
<th align="center">Torrential rain</th>
<th align="center">Rainstorm</th>
<th align="center">Extraordinary rainstorm</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Total amount of rainfall (mm)</td>
<td align="char" char=".">4.03</td>
<td align="char" char=".">6.28</td>
<td align="char" char=".">17.11</td>
<td align="char" char=".">34.20</td>
<td align="char" char=".">96.34</td>
<td align="char" char=".">165.04</td>
</tr>
<tr>
<td align="left">Rainfall duration (min)</td>
<td align="char" char=".">108.82</td>
<td align="char" char=".">153.26</td>
<td align="char" char=".">239.43</td>
<td align="char" char=".">556.12</td>
<td align="char" char=".">761.93</td>
<td align="char" char=".">1698.12</td>
</tr>
<tr>
<td align="left">Maximum rainfall per minute (mm)</td>
<td align="char" char=".">0.32</td>
<td align="char" char=".">0.49</td>
<td align="char" char=".">1.06</td>
<td align="char" char=".">1.58</td>
<td align="char" char=".">1.63</td>
<td align="char" char=".">1.75</td>
</tr>
<tr>
<td align="left">Maximum rainfall in 10&#xa0;min (mm)</td>
<td align="char" char=".">0.92</td>
<td align="char" char=".">1.83</td>
<td align="char" char=".">6.38</td>
<td align="char" char=".">7.74</td>
<td align="char" char=".">9.33</td>
<td align="char" char=".">13.76</td>
</tr>
<tr>
<td align="left">Rainfall intensity (mm/h)</td>
<td align="char" char=".">0.70</td>
<td align="char" char=".">1.03</td>
<td align="char" char=".">1.53</td>
<td align="char" char=".">2.03</td>
<td align="char" char=".">3.19</td>
<td align="char" char=".">4.03</td>
</tr>
<tr>
<td align="left">Dry period (h)</td>
<td align="char" char=".">34.00</td>
<td align="char" char=".">22.43</td>
<td align="char" char=".">20.10</td>
<td align="char" char=".">22.10</td>
<td align="char" char=".">26.30</td>
<td align="char" char=".">14.67</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2-3">
<title>2.3 Methods</title>
<p>As shown in <xref ref-type="fig" rid="F2">Figure 2</xref>, we first processed the minute-level rainfall data (2013&#x2013;2018) into different rainfall characteristics (total amount of rainfall, rainfall duration, maximum rainfall per minute, maximum rainfall in 10&#xa0;min, rainfall intensity, and dry period). Subsequently, we identified the rainfall characteristics that most strongly affect EMC using mathematical statistical methods and three integrated learning methods (RF, GBDT, and XGBoost). Next, we developed an ANN model to predict the EMC values of Shiyan River by inputting typical rainfall characteristics under different rainfall types in terms of rainfall intensity per 24&#xa0;h (namely, light rain, moderate rain, heavy rain, and torrential rain). Finally, we calculated and verified the runoff pollution load of the Shiyan Reservoir using the predicted EMC value.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Research framework for this study.</p>
</caption>
<graphic xlink:href="fenvs-10-887446-g002.tif"/>
</fig>
<sec id="s2-3-1">
<title>2.3.1 Integrated Learning Methods</title>
<p>Integrated learning methods mainly complete research tasks by building and combining multiple different approaches, which can achieve a high accuracy rate. In this study, three widely used integrated learning algorithms (RF, GBDT, and XGBoost) were used to analyze the importance of various rainfall characteristics. RF has been one of the most popular algorithms for solving classification and regression problems in recent years, with extremely high accuracy. GBDT can process a wide range of data types, and parameter tuning is relatively easy. XGBoost is efficient and flexible, and it can prevent overfitting and reduce model complexity.</p>
<sec id="s2-3-1-1">
<title>2.3.1.1 Random Forest</title>
<p>RF is a method for accurately classifying large amounts of data by creating multiple decision trees. The RF algorithm consists of a combination of tree classifiers where each classifier is generated using a random vector sampled independently from the input vector, and each tree casts a unit vote for the most popular class to classify an input vector. The decision trees use the CART algorithm to select variables based on the splitting criteria of the root node and make judgments based on the characteristic evaluation standard; the root node recursively generates child nodes through the internal node. The internal nodes represent the judgments of the characteristics, and each child node represents a regression result. Random attributes are introduced into the training process of decision trees, and the results are determined by the predicted mean values of multiple decision trees. Averaging can alleviate the problem of high variance and high deviation by finding a natural balance between the two extremes. Because RFs are often used as black-box models, they can generate reasonable predictions for data without configuration.</p>
</sec>
<sec id="s2-3-1-2">
<title>2.3.1.2 Gradient Boosting Decision Tree</title>
<p>GBDT is a characteristics selection method with high interpretability. GBDT has high nonlinear processing ability when considering the interactions of multiple groups of characteristics (<xref ref-type="bibr" rid="B16">Huan et al., 2020</xref>). GBDT is a powerful machine learning tool consisting of three parts: regression decision tree, gradient boosting, and shrinkage. GBDT is based on the linear combination of basic functions; multiple rounds of iteration are performed, and each round of iteration produces a weak classifier (regression decision tree). Each classifier is trained based on the gradient of the previous classifiers, and the accuracy of the result is continuously improved by reducing the deviation. The algorithm aims to obtain a set of decision rules using the original characteristics as input to create a new decision tree (<xref ref-type="bibr" rid="B15">He et al., 2014</xref>).</p>
</sec>
<sec id="s2-3-1-3">
<title>2.3.1.3 Extreme Gradient Boosting</title>
<p>XGBoost is an integrated machine learning algorithm based on decision trees that uses a gradient boosting framework. XGBoost has been widely used for regression, classification, and other applications. The core idea of XGBoost is to increase the number of decision trees by continuously splitting characteristics. Every time a tree is added, a new function <italic>f</italic>(<italic>x</italic>) is learned to fit the residual of the last prediction. When the training is completed, resulting in <italic>k</italic> trees, the score of a sample is predicted based on the characteristics of this sample, and the score corresponding to each tree is added to the predicted value of the sample. This method uses regularization in the objective function to prevent overfitting and reduce the complexity of the model.</p>
</sec>
</sec>
<sec id="s2-3-2">
<title>2.3.2 Artificial Neural Network Models</title>
<p>ANN models are networks of parallel distributed information processing systems that link input vectors to output vectors. They are composed of many information processing elements called neurons or nodes (<xref ref-type="bibr" rid="B4">Bisht et al., 2013</xref>). ANNs are mainly composed of three parts: the input layer, hidden layer, and output layer. The input layer primarily provides input data for the ANN model, and the hidden layer performs various transformations of the data (fitting the data by adjusting the function type and the number of neurons in the hidden layer), thus enhancing the network&#x2019;s ability to simulate complex functions. The output layer is considered to be a summary of the parallel calculation results performed by the hidden layer. The result of each neuron is the input of neurons existing in the next layer of the network, and the result of the output layer can be compared with the observed result (<xref ref-type="bibr" rid="B13">Haghiabi et al., 2018</xref>). Because the model is relatively simple and convenient for practical applications and prediction, it is a powerful tool for modeling many nonlinear hydrological processes; for example, ANN models have proven effective for use in the fields of water quality analysis and prediction.</p>
</sec>
<sec id="s2-3-3">
<title>2.3.3 Definition of Event Mean Concentration</title>
<p>Rainfall-runoff pollution events are characterized by uncertainty, and river runoff pollution is affected by factors such as the rainfall characteristics and underlying surface types. Instantaneous pollution concentrations do not accurately capture the characteristics of runoff pollution (<xref ref-type="bibr" rid="B22">Lee et al., 2011</xref>); thus, it is necessary to find a variable to describe the pollution concentration in each rainfall-runoff pollution event. Therefore, in each event, COD was used to characterize water quality, and the degree of rainfall-runoff pollution was analyzed based on the event mean concentration (EMC) (<xref ref-type="bibr" rid="B21">Kim et al., 2007</xref>), which was calculated using the following equation (EMC formula):<disp-formula id="e1">
<mml:math id="m1">
<mml:mrow>
<mml:mtext>EMC</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mi>M</mml:mi>
<mml:mi>V</mml:mi>
</mml:mfrac>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x222b;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mi>T</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:msub>
<mml:mi>Q</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mi>d</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x222b;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mi>T</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:msub>
<mml:mi>Q</mml:mi>
<mml:mi>t</mml:mi>
</mml:msub>
<mml:mi>d</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>where: EMC &#x3d; event mean concentration, mg/L; M &#x3d; total mass of pollutant, g; V &#x3d; runoff volume, m<sup>3</sup>; T &#x3d; rainfall duration, s; C<sub>t</sub> &#x3d; concentration of pollutant over time, mg/L; and <italic>Q</italic>
<sub>
<italic>t</italic>
</sub> &#x3d; flow rate over time, m<sup>3</sup>/s.</p>
</sec>
<sec id="s2-3-4">
<title>2.3.4 Model for Estimating Rainfall-Runoff Pollution</title>
<p>Due to the randomness of surface runoff discharge, the annual pollution load is usually used to estimate the pollution load of urban surface runoff, that is, the total amount of pollutants discharged from surface runoff caused by multiple rainfall events in a year (<xref ref-type="bibr" rid="B23">Li et al., 2010</xref>). The annual non-point-source runoff pollution load of Shiyan River was estimated based on the EMC values under typical rainfall characteristics. This estimation method has been widely used both within and outside of China (<xref ref-type="bibr" rid="B36">Wang, 2015</xref>). The annual runoff pollution load based on the EMC of the site was calculated using the following formula:<disp-formula id="e2">
<mml:math id="m2">
<mml:mrow>
<mml:msub>
<mml:mi>L</mml:mi>
<mml:mi>y</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mi>F</mml:mi>
</mml:msub>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>&#x3c8;</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>A</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>P</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>C</mml:mi>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>where: <italic>L</italic>
<sub>
<italic>y</italic>
</sub> &#x3d; annual pollution load, t; <italic>C<sub>F</sub>
</italic> &#x3d; proportion of rainfall events that produce runoff (when data are lacking, the empirical value of 0.9 is usually used; <xref ref-type="bibr" rid="B36">Wang, 2015</xref>); <italic>&#x3c8;</italic> &#x3d; runoff coefficient; <italic>A</italic> &#x3d; catchment area, km<sup>2</sup>; <italic>P</italic> &#x3d; average annual rainfall, mm; and <italic>C</italic> &#x3d; EMC, mg/L.</p>
</sec>
</sec>
</sec>
<sec id="s3">
<title>3 Results</title>
<sec id="s3-1">
<title>3.1 Effects of Rainfall Characteristics on Event Mean Concentration</title>
<p>In this study, Shiyan River and Shiyan Reservoir were taken as typical research areas to explore the correlation between rainfall characteristics and runoff pollution. COD was used as a typical metric for pollution analysis. For convenience, the EMC formula was used to convert COD to EMC. Due to the low frequency of rainstorms and extraordinary rainstorms (0.03 and 0.01, respectively), these rainfall types were combined with torrential rainfall events in this analysis.</p>
<p>
<xref ref-type="fig" rid="F3">Figure 3</xref> shows the relationships between rainfall type and EMC based on rainfall data from 26 rainfall events (2009&#x2013;2012). The vertical axis of the box plot represents the degree of data dispersion, and the center represents the typical distribution probability of EMC. Therefore, the typical value of EMC represents the location corresponding to the maximum distribution probability. In general, the typical EMC value is largest during light rain; the EMC during light rain (based on the median value) was almost four times higher than that during moderate rain, which was associated with the lowest EMC. Meanwhile, the EMC values corresponding to heavy rain and torrential rain were much lower than that for light rain.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>EMC values under different rainfall types.</p>
</caption>
<graphic xlink:href="fenvs-10-887446-g003.tif"/>
</fig>
<p>Evaluating the effect of rainfall type on EMC requires analyzing the effects of different rainfall characteristics on EMC. In the case of light rain, the initial stage of rainfall will wash urban surface pollutants into the river, increasing the EMC. During moderate rain, rainfall runoff gradually increases, and the pollutants washed into the river channel change little, which reduces the EMC to a large degree. For heavy rain and torrential rain, the erosion of the river channel may wash pollutants from the deep layers of the ground into the river channel, resulting in a gradual increase in EMC.</p>
<p>Principal component analysis (PCA) was used to identify the correlations between rainfall characteristics and EMC. <xref ref-type="fig" rid="F4">Figure 4</xref> shows the results of the PCA of rainfall characteristics and EMC. PC1 and PC2 explained 42% and 20.5% of the total variance of the data, respectively. The proportion contributed by each rainfall characteristic to PC1 and PC2 can be obtained from the directions and lengths of the blue arrows in <xref ref-type="fig" rid="F4">Figure 4</xref>. Most of the scattered points in <xref ref-type="fig" rid="F4">Figure 4</xref> are within the 95% confidence interval (shown by the red circle), which indicates that there were no obvious extreme values. A correlation matrix was used to calculate the correlation coefficients between EMC and the rainfall characteristics (<xref ref-type="fig" rid="F5">Figure 5</xref>). In <xref ref-type="fig" rid="F5">Figure 5</xref>, red and blue represent positive and negative correlations, respectively, and the intensity of the color indicates the strength of the correlation. Among the rainfall characteristics, dry period showed the strongest correlation with EMC (correlation coefficient &#x3d; 0.5). Average rainfall intensity was negatively correlated with EMC (correlation coefficient &#x3d; &#x2212;0.13). The initial, average, and maximum runoff intensities were highly correlated. If the angle between the arrows of two variables in <xref ref-type="fig" rid="F4">Figure 4</xref> was less than 30&#xb0;, and their correlation coefficient was greater than 0.8 in <xref ref-type="fig" rid="F5">Figure 5</xref>, we considered the correlation between the two variables to be significant. Using these criteria, no significant correlations were observed between EMC and any single rainfall characteristic. Thus, it was necessary to further analyze the data to reveal the relationships between multiple rainfall characteristics and EMC.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>PCA results between rainfall characteristics and EMC. PC1 and PC2 represent 42% and 20.5% of the total variance of the data, respectively. Red dots represent the scores of rainfall events. The red circle represents the 95% confidence interval. The blue arrows represent the proportions contributed by rainfall characteristics to PC1 and PC2.</p>
</caption>
<graphic xlink:href="fenvs-10-887446-g004.tif"/>
</fig>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Correlations between rainfall characteristics and EMC. Red and blue squares represent positive and negative correlations between two characteristics, respectively. Deeper color indicates a stronger correlation.</p>
</caption>
<graphic xlink:href="fenvs-10-887446-g005.tif"/>
</fig>
<p>Using six rainfall characteristics (dry period, total amount of rainfall, average rainfall intensity, rainfall duration, maximum rainfall intensity in 10&#xa0;min, and initial runoff intensity), we performed multiple linear regression fitting for EMC. <xref ref-type="fig" rid="F6">Figure 6</xref> shows the relationships between EMC and various rainfall characteristics. Each black dot represents the EMC value of a rainfall event, and each figure contains 26 rainfall events. By constructing a linear fitting curve, we can observe the effects of different rainfall characteristics on EMC. In <xref ref-type="fig" rid="F6">Figure 6</xref>, the dark orange range represents the 95% confidence interval between different rainfall characteristics and EMC, while the light orange range represents the 95% prediction interval between them. A positive correlation was observed between the dry period and EMC, while EMC gradually decreased as the initial runoff intensity increased. As the total amount of rainfall increased, EMC first decreased and then increased; a similar trend in EMC was observed for the maximum rainfall intensity. Thus, EMC showed different relationships with the various rainfall characteristics.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Relationship between EMC and rainfall characteristics. Each black dot represents the EMC value of a rainfall event. The dark orange range represents the 95% confidence interval, while the light orange range represents the 95% prediction interval.</p>
</caption>
<graphic xlink:href="fenvs-10-887446-g006.tif"/>
</fig>
</sec>
<sec id="s3-2">
<title>3.2 Analysis of the Relative Importance of Different Rainfall Characteristics in Determining Event Mean Concentration</title>
<p>Three widely used machine learning algorithms (RF, GBDT, and XGBoost) were used to analyze the relative importance of rainfall characteristics affecting runoff pollution (<xref ref-type="fig" rid="F7">Figure 7</xref>). The most important rainfall characteristic affecting EMC was the dry period followed by the average rainfall intensity, the maximum rainfall in 10&#xa0;min, the total amount of rainfall, and the initial runoff intensity. The high importance of the dry period may be related to the accumulation of surface pollutants during dry periods. During rainfall after an extended dry period, large quantities of pollutants are washed into the river, causing the EMC in the river to increase. However, due to the large differences in rainfall duration observed in the data, the effect of rainfall duration on EMC was relatively weak. The risk of runoff pollution was quantified by selecting the rainfall characteristics with the strongest effects on EMC based on the above analysis.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Importance rankings of different rainfall characteristics in terms of their effect on EMC based on GBDT, RF, and XGBoost algorithms.</p>
</caption>
<graphic xlink:href="fenvs-10-887446-g007.tif"/>
</fig>
</sec>
<sec id="s3-3">
<title>3.3 Construction and Analysis of the Prediction Model</title>
<p>Analyzing the input data improves the interpretability of the input data for neural network models. We established a model to predict runoff pollution from rainfall characteristics based on the relative importance of different rainfall characteristics and the availability of actual forecast data. The model considered the five rainfall characteristics with the strongest effects on EMC (i.e., dry period, average rainfall intensity, maximum rainfall in 10&#xa0;min, total amount of rainfall, and initial runoff intensity), and the corresponding EMC values were used as the training targets. A total of 70% of the original data was used to train the ANN model, while the remaining 30% of the original data was used to verify the ANN model.</p>
<p>
<xref ref-type="fig" rid="F8">Figure 8</xref> shows the training performance of the ANN model. The model training performance was 0.976, the test performance was 0.989, and the verification performance was 0.883. It can also be seen from <xref ref-type="fig" rid="F8">Figure 8</xref> that most of the scattered points are clustered near the fitted line, which shows that the response results of this model are good; thus, the model can be used to predict EMC. The frequencies of rainstorms and extraordinary rainstorms were extremely low; thus, these rainfall types were ignored in the analysis of runoff pollution. Therefore, the typical EMC values for each rainfall characteristic under the other four rainfall types were used to predict EMC.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Plot showing the ANN training performance.</p>
</caption>
<graphic xlink:href="fenvs-10-887446-g008.tif"/>
</fig>
<p>Under typical rainfall characteristics, the predicted EMC value was highest under the light rain scenario (2612.20&#xa0;mg/L), and this EMC was approximately two times the predicted EMC under moderate rain (<xref ref-type="table" rid="T2">Table 2</xref>). The EMC prediction values for heavy rain and torrential rain were almost the same (both were one-fifth of the predicted EMC value for light rain). This may be explained by the fact that the dry period under the light rain scenario was typically longer than that under other rain types; thus, the dilution effect of pollutants washing into the river channel during light rain was weak. The dilution effect of heavy and moderate rain was more pronounced; under the torrential rain scenario, the predicted EMC value increased slowly because of the stronger effects of rainfall duration and runoff area. Rainfall events following long dry periods and light rain events require additional attention, and measures should be enacted in a timely manner to prevent water pollution.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Effects of typical rainfall characteristics on EMC.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Rainfall characteristics</th>
<th align="center">Light rain</th>
<th align="center">Moderate rain</th>
<th align="center">Heavy rain</th>
<th align="center">Torrential rain</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Dry period (h)</td>
<td align="char" char=".">34.00</td>
<td align="char" char=".">22.43</td>
<td align="char" char=".">20.10</td>
<td align="char" char=".">22.10</td>
</tr>
<tr>
<td align="left">Rainfall depth (mm)</td>
<td align="char" char=".">4.03</td>
<td align="char" char=".">6.28</td>
<td align="char" char=".">17.11</td>
<td align="char" char=".">34.20</td>
</tr>
<tr>
<td align="left">Maximum rainfall in 10&#xa0;min (mm)</td>
<td align="char" char=".">0.92</td>
<td align="char" char=".">1.83</td>
<td align="char" char=".">6.38</td>
<td align="char" char=".">7.74</td>
</tr>
<tr>
<td align="left">Rainfall intensity (mm/h)</td>
<td align="char" char=".">0.70</td>
<td align="char" char=".">1.03</td>
<td align="char" char=".">1.53</td>
<td align="char" char=".">2.03</td>
</tr>
<tr>
<td align="left">Initial runoff (m<sup>3</sup>/s)</td>
<td align="char" char=".">0.76</td>
<td align="char" char=".">0.94</td>
<td align="char" char=".">2.07</td>
<td align="char" char=".">1.40</td>
</tr>
<tr>
<td align="left">Frequency</td>
<td align="char" char=".">0.20</td>
<td align="char" char=".">0.37</td>
<td align="char" char=".">0.18</td>
<td align="char" char=".">0.11</td>
</tr>
<tr>
<td align="left">EMC (mg/L)</td>
<td align="char" char=".">2612.20</td>
<td align="char" char=".">1404.50</td>
<td align="char" char=".">596.24</td>
<td align="char" char=".">649.50</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The annual pollution load of non-point-source runoff for Shiyan River was estimated based on the predicted EMC values under typical rainfall characteristics (<xref ref-type="table" rid="T1">Table 1</xref>). EMC was used to approximate the annual runoff pollution load. Given that the traditional method of EMC value selection is relatively random, the predicted EMC values under typical rainfall events should be used. Hence, the estimation of rainfall-runoff pollution load considered the predicted values of EMC under typical rainfall events along with the probabilities of different rainfall patterns. The proportion of runoff events was 0.9, and the multi-year average runoff depth of Shiyan River was 860&#xa0;mm (average runoff depth is the product of the runoff coefficient and annual average rainfall). The EMC under each rainfall pattern was predicted by the model from the typical rainfall characteristics; the actual EMC value of the river was then obtained as the average of these predictions weighted by the probabilities of the different rainfall patterns, which was 1460&#xa0;mg/L. Thus, according to the conversion of <xref ref-type="disp-formula" rid="e2">Eq. 2</xref>, the annual non-point-source COD pollution load was calculated to be 497.6&#xa0;t. The annual non-point-source pollution load of COD in the built-up area of Shiyan Reservoir was previously reported to be 477&#xa0;t (<xref ref-type="bibr" rid="B41">Yang et al., 2013</xref>), indicating an estimation accuracy for our model of 95.98%.</p>
</sec>
</sec>
<sec id="s4">
<title>4 Conclusion and Discussion</title>
<p>Integrated learning methods were used to analyze the relationships between rainfall characteristics and EMC for Shiyan River. Rainfall characteristics were then used to predict the water quality by constructing an ANN model. The main findings are summarized below.</p>
<p>PCA of the rainfall characteristics revealed no significant correlations between EMC and any single rainfall characteristic. A positive correlation was observed between rainfall dry period and EMC, while EMC was negatively correlated with initial runoff intensity. Using mathematical statistical analysis and a variety of machine learning algorithms, we qualitatively described and ranked the effects of different rainfall characteristics on EMC. Among all rainfall characteristics, the dry period was the most important factor influencing EMC. This can be attributed to the build-up of surface pollutants as the dry period becomes longer. When rainfall occurs after a long dry period, large quantities of pollutants are washed into the river, causing EMC to increase. After the dry period, the next most important rainfall characteristics were average rainfall intensity, maximum rainfall in 10&#xa0;min, total amount of rainfall, and initial runoff intensity.</p>
<p>A model to predict EMC based on rainfall characteristics was constructed using the above five most influential rainfall characteristics as inputs, which greatly improved the interpretability of the neural network and the accuracy of the ANN model. The model training performance was 0.976, the test performance was 0.989, and the verification performance was 0.883. The prediction results under typical rainfall characteristics revealed that the runoff pollution caused by light rain is approximately two times that under moderate rain and five times that under heavy rain. Based on the predicted EMC values under typical rainfall characteristics, the annual non-point-source runoff pollution load of Shiyan River was estimated to be 497.6&#xa0;t. The accuracy of the estimation method was 95.98%, indicating the robustness of the model.</p>
<p>We acknowledge that there are several limitations of this study. The relatively short time scale of the high-precision rainfall data in Shenzhen precludes a more in-depth study of future rainfall characteristics and trends under the influence of climate change. Because of the difficulty in monitoring rainfall-runoff pollution, the total number of samples used in this study was only 26 rainfall events. To assess the credibility of the results, we also applied the RF and XGBoost methods to these data. As can be seen in <xref ref-type="fig" rid="F9">Figure 9</xref>, the simulation results of these two methods are good. The coefficients of determination (r<sup>2</sup>) obtained by the RF and XGBoost methods were 0.879 and 0.914, respectively, which are similar to the result obtained with the ANN model (0.9). These results indicate that our findings are reliable. Nevertheless, subsequent studies should collect data over a longer time scale and consider the effects of land use and other factors on water quality/runoff pollution. The focus of this study was the relationships between rainfall characteristics and runoff pollution. Machine learning models can also be used to integrate rainfall and runoff data in future research.</p>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Plot showing the training performance by RF and XGBoost.</p>
</caption>
<graphic xlink:href="fenvs-10-887446-g009.tif"/>
</fig>
<p>The results of this study have implications for the utilization of urban rainwater and resources, engineering design, predicting rainfall-runoff pollution risk, and policy development.</p>
</sec>
</body>
<back>
<sec id="s5">
<title>Data Availability Statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="s6">
<title>Author Contributions</title>
<p>ZT: Conceptualization, Discussion, Supervision, Writing (review and editing); ZY: Data curation, Planning, Writing (original draft); YL: Methodology, Data curation, Discussion; QK: Discussion, Writing (review and editing); JL: Conceptualization, Discussion, Supervision, Writing (review and editing); HL: Data provision, Discussion; YT: Data provision, Discussion. All authors read and approved the final manuscript.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>This study was supported by the Science, Technology and Innovation Commission of Shenzhen Municipality (JCYJ20210324104004013). It was also supported by the National Key R&#x0026;D Program of China (No. 2018YFE0206200).</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of Interest</title>
<p>Author YT was employed by the company PowerChina Huadong Engineering Corporation Limited.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ack>
<p>We acknowledge Aifang Chen, Wenfang Cao and Yanlong Guan of the iTOWER group for discussion and Pengfei Wang of the Southern University of Science and Technology for modifying graphs. We also acknowledge Xingxing Huang of the Shanghai Institute of Technology for his help.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Adeyeri</surname>
<given-names>O. E.</given-names>
</name>
<name>
<surname>Laux</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Lawin</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Arnault</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Assessing the Impact of Human Activities and Rainfall Variability on the River Discharge of Komadugu-Yobe Basin, Lake Chad Area</article-title>. <source>Environ. Earth Sci.</source> <volume>79</volume> (<issue>6</issue>), <fpage>1</fpage>&#x2013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.1007/s12665-020-8875-y</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alias</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Goonetilleke</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Egodawatta</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Time as the Critical Factor in the Investigation of the Relationship between Pollutant Wash-Off and Rainfall Characteristics</article-title>. <source>Ecol. Eng.</source> <volume>64</volume>, <fpage>301</fpage>&#x2013;<lpage>305</lpage>. <pub-id pub-id-type="doi">10.1016/j.ecoleng.2014.01.008</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Badrzadeh</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Sarukkalige</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Jayawardena</surname>
<given-names>A. W.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Hourly Runoff Forecasting for Flood Risk Management: Application of Various Computational Intelligence Models</article-title>. <source>J. Hydrology</source> <volume>529</volume>, <fpage>1633</fpage>&#x2013;<lpage>1643</lpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2015.07.057</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bisht</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Jain</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Raju</surname>
<given-names>M. M.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Prediction of Water Table Elevation Fluctuation through Fuzzy Logic &#x26; Artificial Neural Networks</article-title>. <source>Int. J. Adv. Sci. Technol.</source> <volume>51</volume>, <fpage>107</fpage>&#x2013;<lpage>120</lpage>. </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chau</surname>
<given-names>K.-w.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Use of Meta-Heuristic Techniques in Rainfall-Runoff Modelling</article-title>. <source>Water</source> <volume>9</volume> (<issue>3</issue>), <fpage>186</fpage>. <pub-id pub-id-type="doi">10.3390/w9030186</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Theller</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Gitau</surname>
<given-names>M. W.</given-names>
</name>
<name>
<surname>Engel</surname>
<given-names>B. A.</given-names>
</name>
<name>
<surname>Harbor</surname>
<given-names>J. M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Urbanization Impacts on Surface Runoff of the Contiguous United States</article-title>. <source>J. Environ. Manag.</source> <volume>187</volume>, <fpage>470</fpage>&#x2013;<lpage>481</lpage>. <pub-id pub-id-type="doi">10.1016/j.jenvman.2016.11.017</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feng</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Mi</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Di</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Analysis of Road Runoff Pollution in Northern City Based on the Typical Rainfall</article-title>. <source>Ecol. Environ. Sci.</source> <volume>24</volume> (<issue>3</issue>), <fpage>418</fpage>&#x2013;<lpage>426</lpage>. <pub-id pub-id-type="doi">10.16258/j.cnki.1674-5906.2015.03.008</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feng</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mingming</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Muhua</surname>
<given-names>F.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Analysis of Pollution Characteristics and First Flush Effect in Rainfall Runoff in Separate Storm Sewer System in Upstream of Tangxi River, Chaohu Catchment</article-title>. <source>Hupo Kexue/Journal Lake Sci.</source> <volume>29</volume> (<issue>2</issue>), <fpage>285</fpage>&#x2013;<lpage>296</lpage>. <pub-id pub-id-type="doi">10.18307/2017.0204</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fernandes</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Chaves</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Lima</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Neves</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Vicente</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Draw on Artificial Neural Networks to Assess and Predict Water Quality</article-title>. <source>IOP Conf. Ser. Earth Environ. Sci.</source> <volume>612</volume> (<issue>1</issue>), <fpage>012028</fpage>. <pub-id pub-id-type="doi">10.1088/1755-1315/612/1/012028</pub-id> </citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fotovatikhah</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Herrera</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Shamshirband</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Chau</surname>
<given-names>K.-w.</given-names>
</name>
<name>
<surname>Faizollahzadeh Ardabili</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Piran</surname>
<given-names>M. J.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Survey of Computational Intelligence as Basis to Big Flood Management: Challenges, Research Directions and Future Work</article-title>. <source>Eng. Appl. Comput. Fluid Mech.</source> <volume>12</volume> (<issue>1</issue>), <fpage>411</fpage>&#x2013;<lpage>437</lpage>. <pub-id pub-id-type="doi">10.1080/19942060.2018.1448896</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gnecco</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Berretta</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Lanza</surname>
<given-names>L. G.</given-names>
</name>
<name>
<surname>La Barbera</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Storm Water Pollution in the Urban Environment of Genoa, Italy</article-title>. <source>Atmos. Res.</source> <volume>77</volume> (<issue>1&#x2013;4</issue>), <fpage>60</fpage>&#x2013;<lpage>73</lpage>. <pub-id pub-id-type="doi">10.1016/j.atmosres.2004.10.017</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Haghiabi</surname>
<given-names>A. H.</given-names>
</name>
<name>
<surname>Nasrolahi</surname>
<given-names>A. H.</given-names>
</name>
<name>
<surname>Parsaie</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Water Quality Prediction Using Machine Learning Methods</article-title>. <source>Water Qual. Res. J.</source> <volume>53</volume> (<issue>1</issue>), <fpage>3</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.2166/wqrj.2018.025</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>He</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Qi</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Analysis of the Temporal and Spatial Characteristics of Rainfall-Runoff Pollution in Dianbei Basin of Shanghai</article-title>. <source>Acta Sci. Circumstantiae</source> <volume>38</volume> (<issue>2</issue>), <fpage>536</fpage>&#x2013;<lpage>545</lpage>. <pub-id pub-id-type="doi">10.13671/j.hjkxxb.2017.0338</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>He</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Bowers</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Candela</surname>
<given-names>J. Q.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). &#x201c;<article-title>Practical Lessons from Predicting Clicks on Ads at Facebook</article-title>,&#x201d; in <conf-name>Proceedings of the Eighth International Workshop on Data Mining for Online Advertising (ADKDD&#x2019;14)</conf-name>, <conf-loc>Menlo Park, CA</conf-loc>, <conf-date>August 24, 2014</conf-date> (<publisher-name>ADKDD&#x2019;14</publisher-name>), <fpage>1</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1145/2648584.2648589</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Prediction of Dissolved Oxygen in Aquaculture Based on Gradient Boosting Decision Tree and Long Short-Term Memory Network: A Study of Chang Zhou Fishery Demonstration Base, China</article-title>. <source>Comput. Electron. Agric.</source> <volume>175</volume>, <fpage>105530</fpage>. <pub-id pub-id-type="doi">10.1016/j.compag.2020.105530</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Ye</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Ke</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Evaluation of Short-Term Streamflow Prediction Methods in Urban River Basins</article-title>. <source>Phys. Chem. Earth, Parts A/B/C</source> <volume>123</volume>, <fpage>103027</fpage>. <pub-id pub-id-type="doi">10.1016/j.pce.2021.103027</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jeung</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Baek</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Beom</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Cho</surname>
<given-names>K. H.</given-names>
</name>
<name>
<surname>Her</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yoon</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Evaluation of Random Forest and Regression Tree Methods for Estimation of Mass First Flush Ratio in Urban Catchments</article-title>. <source>J. Hydrology</source> <volume>575</volume>, <fpage>1099</fpage>&#x2013;<lpage>1110</lpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2019.05.079</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Joslyn</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Water Quality Factor Prediction Using Supervised Machine Learning Citation Details</article-title>. <comment>REU Final Report</comment>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://archives.pdx.edu/ds/psu/26231">https://archives.pdx.edu/ds/psu/26231</ext-link> (Accessed November 20, 2021)</comment>. </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kammen</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Sunter</surname>
<given-names>D. A.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>City-integrated Renewable Energy for Urban Sustainability</article-title>. <source>Science</source> <volume>352</volume> (<issue>6288</issue>), <fpage>922</fpage>&#x2013;<lpage>928</lpage>. <pub-id pub-id-type="doi">10.1126/science.aad9302</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Chung</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Water Quality of Runoff from Agricultural-Forestry Watersheds in the Geum River Basin, Korea</article-title>. <source>Environ. Monit. Assess.</source> <volume>134</volume> (<issue>1&#x2013;3</issue>), <fpage>441</fpage>&#x2013;<lpage>452</lpage>. <pub-id pub-id-type="doi">10.1007/s10661-007-9635-0</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>J. Y.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>M. Y.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Characteristics of the Event Mean Concentration (EMC) from Rainfall Runoff on an Urban Highway</article-title>. <source>Environ. Pollut.</source> <volume>159</volume> (<issue>4</issue>), <fpage>884</fpage>&#x2013;<lpage>888</lpage>. <pub-id pub-id-type="doi">10.1016/j.envpol.2010.12.022</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Study on the Calculation Method for Urban Surface Runoff Pollution Load</article-title>. <source>J. Water Res. Water Eng.</source> <volume>21</volume> (<issue>2</issue>), <fpage>5</fpage>&#x2013;<lpage>13</lpage>. </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>The Emergence of Anthropogenic Signal in Mean and Extreme Precipitation Trend over China by Using Two Large Ensembles</article-title>. <source>Environ. Res. Lett.</source> <volume>16</volume> (<issue>1</issue>), <fpage>014052</fpage>. <pub-id pub-id-type="doi">10.1088/1748-9326/abd26d</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2020</year>). <source>Analysis of Rainfall Characteristics and Their Influence on Runoff and Water Quality in Maozhou River</source>. <comment>Master&#x2019;s Thesis</comment>. <publisher-loc>Harbin (China)</publisher-loc>: <publisher-name>Harbin Institute of Technology</publisher-name>. </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Predicting Hard Rock Pillar Stability Using GBDT, XGBoost, and LightGBM Algorithms</article-title>. <source>Mathematics</source> <volume>8</volume> (<issue>5</issue>), <fpage>765</fpage>. <pub-id pub-id-type="doi">10.3390/math8050765</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Guan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Impact of Catchment and Rainfall Characteristics on Urban Runoff Quality</article-title>. <source>J. Tsinghua Univ (Sci Technol)</source> <volume>54</volume> (<issue>7</issue>), <fpage>846</fpage>&#x2013;<lpage>852</lpage>. <pub-id pub-id-type="doi">10.16511/j.cnki.qhdxxb.2014.07.004</pub-id> </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Palani</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Liong</surname>
<given-names>S.-Y.</given-names>
</name>
<name>
<surname>Tkalich</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>An ANN Application for Water Quality Forecasting</article-title>. <source>Mar. Pollut. Bull.</source> <volume>56</volume> (<issue>9</issue>), <fpage>1586</fpage>&#x2013;<lpage>1597</lpage>. <pub-id pub-id-type="doi">10.1016/j.marpolbul.2008.05.021</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Lv</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Nonpoint Source Pollution from Urban Runoff and Pollution Abatement in Urban Waterways</article-title>. <source>Environ. Sci. Technol.</source> <volume>35</volume> (<issue>12</issue>), <fpage>2</fpage>&#x2013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.3969/j.issn.1003-6504.2012.12.037</pub-id> </citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Perera</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>McGree</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Egodawatta</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Jinadasa</surname>
<given-names>K. B. S. N.</given-names>
</name>
<name>
<surname>Goonetilleke</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Taxonomy of Influential Factors for Predicting Pollutant First Flush in Urban Stormwater Runoff</article-title>. <source>Water Res.</source> <volume>166</volume>, <fpage>115075</fpage>. <pub-id pub-id-type="doi">10.1016/j.watres.2019.115075</pub-id> </citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qin</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Frequency Analysis of Urban Runoff Quality in an Urbanizing Catchment of Shenzhen, China</article-title>. <source>J. Hydrology</source> <volume>496</volume>, <fpage>79</fpage>&#x2013;<lpage>88</lpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2013.04.053</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ran</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Su</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Experimental Study of the Impact of Rainfall Characteristics on Runoff Generation and Soil Erosion</article-title>. <source>J. Hydrology</source> <volume>424-425</volume>, <fpage>99</fpage>&#x2013;<lpage>111</lpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2011.12.035</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shi</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Applying High-Frequency Surrogate Measurements and a Wavelet-ANN Model to Provide Early Warnings of Rapid Surface Water Quality Anomalies</article-title>. <source>Sci. Total Environ.</source> <volume>610-611</volume>, <fpage>1390</fpage>&#x2013;<lpage>1399</lpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2017.08.232</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yao</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Using Class Imbalance Learning for Software Defect Prediction</article-title>. <source>IEEE Trans. Rel.</source> <volume>62</volume> (<issue>2</issue>), <fpage>434</fpage>&#x2013;<lpage>443</lpage>. <pub-id pub-id-type="doi">10.1109/TR.2013.2259203</pub-id> </citation>
</ref>
<ref id="B35">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Tian</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2016</year>). <source>Research on Measurement and Evaluation Methods of Stormwater Runoff Pollution Load</source>. <comment>Master&#x2019;s Thesis</comment>. <publisher-loc>Beijing (China)</publisher-loc>: <publisher-name>Beijing University of Civil Engineering and Architecture</publisher-name>. </citation>
</ref>
<ref id="B36">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2015</year>). <source>Pollution Characteristics Analysis and Pollution Load Estimation in Rainfall Runoff of Different Underlying Surface in Wuhan City</source>. <comment>Master&#x2019;s Thesis</comment>. <publisher-loc>Wuhan (China)</publisher-loc>: <publisher-name>Huazhong University of Science and Technology</publisher-name>. </citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Lai</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bai</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Flood Hazard Risk Assessment Model Based on Random Forest</article-title>. <source>J. Hydrology</source> <volume>527</volume>, <fpage>1130</fpage>&#x2013;<lpage>1141</lpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2015.06.008</pub-id> </citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Qi</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Nan</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>How Do Urban Rainfall-Runoff Pollution Control Technologies Develop in China? A Systematic Review Based on Bibliometric Analysis and Literature Summary</article-title>. <source>Sci. Total Environ.</source> <volume>789</volume>, <fpage>148045</fpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2021.148045</pub-id> </citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Ye</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Ng</surname>
<given-names>M. K.</given-names>
</name>
<name>
<surname>Ho</surname>
<given-names>S.-S.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Forestexter: An Efficient Random Forest Algorithm for Imbalanced Text Categorization</article-title>. <source>Knowledge-Based Syst.</source> <volume>67</volume>, <fpage>105</fpage>&#x2013;<lpage>116</lpage>. <pub-id pub-id-type="doi">10.1016/j.knosys.2014.06.004</pub-id> </citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Qian</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>A Novel Assessment Considering Spatial and Temporal Variations of Water Quality to Identify Pollution Sources in Urban Rivers</article-title>. <source>Sci. Rep.</source> <volume>11</volume>, <fpage>8714</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-021-87671-4</pub-id> </citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Study on Pollution Load of Watershed in Shiyan Reservoirs in Shenzhen</article-title>. <source>Res. Conserv. Environ. Prot.</source> <volume>8</volume>, <fpage>174</fpage>. <pub-id pub-id-type="doi">10.16317/j.cnki.12-1377/x.2013.08.100</pub-id> </citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ye</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Tu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Jia</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Tackling Environmental Challenges in Pollution Controls Using Artificial Intelligence: A Review</article-title>. <source>Sci. Total Environ.</source> <volume>699</volume>, <fpage>134279</fpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2019.134279</pub-id> </citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Che</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Pollutant First Flush Identification and its Implications for Urban Runoff Pollution Control: A Roof and Road Runoff Case Study in Beijing, China</article-title>. <source>Water Sci. Technol.</source> <volume>83</volume> (<issue>11</issue>), <fpage>2829</fpage>&#x2013;<lpage>2840</lpage>. <pub-id pub-id-type="doi">10.2166/wst.2021.157</pub-id> </citation>
</ref>
<ref id="B44">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2011</year>). <source>Frequency Analysis of Rainfall Runoff Quality in Urbanizing Catchment: A Case Study of Shiyan River Catchment in Shenzhen</source>. <comment>Master&#x2019;s Thesis</comment>. <publisher-loc>Beijing (China)</publisher-loc>: <publisher-name>Peking University</publisher-name>. </citation>
</ref>
</ref-list>
</back>
</article>