<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Environ. Sci.</journal-id>
<journal-title>Frontiers in Environmental Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Environ. Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-665X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1222871</article-id>
<article-id pub-id-type="doi">10.3389/fenvs.2023.1222871</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Environmental Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Estimation of key potentially toxic elements in arid agricultural soils using Vis-NIR spectroscopy with variable selection and PLSR algorithms</article-title>
<alt-title alt-title-type="left-running-head">Nawar et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fenvs.2023.1222871">10.3389/fenvs.2023.1222871</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Nawar</surname>
<given-names>Said</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1994406/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Mohamed</surname>
<given-names>Elsayed Said</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1841527/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Essam-Eldeen Sayed</surname>
<given-names>Safa</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Mohamed</surname>
<given-names>Wagih S.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Rebouh</surname>
<given-names>Nazih Y.</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Hammam</surname>
<given-names>Amr A.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2321117/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Soil and Water Department</institution>, <institution>Faculty of Agriculture</institution>, <institution>Suez Canal University</institution>, <addr-line>Ismailia</addr-line>, <country>Egypt</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>National Authority for Remote Sensing and Space Sciences</institution>, <addr-line>Cairo</addr-line>, <country>Egypt</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Soil Science Department</institution>, <institution>Faculty of Agriculture</institution>, <institution>Minia University</institution>, <addr-line>El-Minia</addr-line>, <country>Egypt</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Department of Environmental Management</institution>, <institution>Institute of Environmental Engineering, RUDN University</institution>, <addr-line>Moscow</addr-line>, <country>Russia</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1110540/overview">Songchao Chen</ext-link>, ZJU-Hangzhou Global Scientific and Technological Innovation Center, China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1119723/overview">Yuxin Ma</ext-link>, Manaaki Whenua Landcare Research, New Zealand</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1780033/overview">Dongyun Xu</ext-link>, Shandong Agricultural University, China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Said Nawar, <email>said.nawar@agr.suez.edu.eg</email>; Elsayed Said Mohamed, <email>salama55@mail.ru</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>17</day>
<month>07</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>11</volume>
<elocation-id>1222871</elocation-id>
<history>
<date date-type="received">
<day>16</day>
<month>05</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>07</day>
<month>07</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Nawar, Mohamed, Essam-Eldeen Sayed, Mohamed, Rebouh and Hammam.</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Nawar, Mohamed, Essam-Eldeen Sayed, Mohamed, Rebouh and Hammam</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Potentially toxic elements (PTEs) pose a significant threat to soil and the environment. Therefore, the fast quantification of PTEs is crucial for better management of contaminated sites. Versatile technique such as Visible near-infrared spectroscopy (Vis&#x2013;NIRS) (350&#x2013;2,500&#xa0;nm) has attracted tremendous attention for assessing PTEs and has achieved promising results combined with successful multivariate analysis. This research investigated the potential of Vis&#x2013;NIRS combined with partial least squares regression (PLSR) and variable selection methods to assess key PTEs (Cd, Co, Cu, Cr, Pb, and Zn) in agricultural soils under arid conditions. The soil samples (80) were collected from a polluted area around Al-Moheet drainage, Minya Governorate&#x2013;upper Egypt. The samples were scanned using an ASD FieldSpec-4 spectroradiometer. Simulated annealing (SA) and uninformative variable elimination (UVE) were used to select the effective wavelengths in predicting PTEs. PLSR was used to develop the spectral models using the full range (FR-PLS) and feature-selected spectra techniques SA (SA-PLS) and UVE (UVE-PLS). The results indicated that UVE-PLS models performed better than FR-PLS and SA-PLS models in predicting the key PTEs. The obtained coefficient of determination (R<sup>2</sup>) and the ratio of performance to deviation (RPD) were 0.74 and 2.48 (Cr), 0.72 and 2.03 (Pb), 0.62 and 1.86 (Cd), 0.59 and 1.78 (Cu), 0.52 and 1.68 (Co), and 0.46 and 1.41 (Zn), respectively. The results suggested that the UVE-PLS spectral model is promising for predicting Cr, Pb, and Cd, and can be improved for predicting Cu, Co, and Zn elements in agricultural soils.</p>
</abstract>
<kwd-group>
<kwd>hyperspectral data</kwd>
<kwd>spectroscopy</kwd>
<kwd>soil analysis</kwd>
<kwd>heavy metals</kwd>
<kwd>variable selection</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Environmental Informatics and Remote Sensing</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Potentially toxic elements (PTEs) accumulation in agricultural soils can cause serious health problems for humans and negatively impact ecosystems (<xref ref-type="bibr" rid="B25">Khan et al., 2008</xref>; <xref ref-type="bibr" rid="B57">Zhang et al., 2009</xref>). PTEs, such as cadmium (Cd), chromium (Cr), cobalt (Co), copper (Cu), lead (Pb), and zinc (Zn), constitute a significant group of soil contaminants (<xref ref-type="bibr" rid="B7">Bruemmer et al., 1986</xref>). These elements endanger human and animal health by entering the water, soil, plants, and food chain (<xref ref-type="bibr" rid="B16">Gholizadeh et al., 2018</xref>). Because of their persistence and long biological half-lives, they disrupt the nutrient balance in the soil and reduce plant growth (<xref ref-type="bibr" rid="B43">Shi et al., 2018</xref>). As a result, quantification of PTEs in the soil is critical for efficient monitoring and subsequent remediation. Traditionally, PTEs have been quantified using wet chemistry, such as inductively coupled plasma (ICP) analysis or atomic absorption spectrometry (AAS). These methods are time-consuming, expensive, and unsuitable for many soil samples (<xref ref-type="bibr" rid="B35">Nawar et al., 2020</xref>). Therefore, there is a rising need for detection and measurement equipment that can be used on-site and in real-time, which has contributed to advancing new techniques such as visible and near-infrared spectroscopy (Vis-NIRS).</p>
<p>Vis-NIRS is a commonly effective tool for soil analysis, such as soil organic carbon (SOC), texture, nutrients, and PTEs. Modern instrumental spectroscopic technologies analyse samples at high resolution, yielding many spectral variables per sample. The high-resolution measurement can result in large predictors (p) and small (n) samples, which occur when the number of spectral variables exceeds the number of samples, and have posed difficulties in analysing the relationship between the target (e.g., soil properties) and spectral variables. Therefore, appropriate statistics algorithms are required to extract useful information from spectra. Partial least squares regression (PLSR) is a widely used algorithm coupled with variable selection strategies (<xref ref-type="bibr" rid="B54">Xiaobo et al., 2010</xref>). PLSR is a popular multivariate regression technique that can handle many noisy and correlated variables and small samples (<xref ref-type="bibr" rid="B51">Wold et al., 2001</xref>; <xref ref-type="bibr" rid="B13">Forina et al., 2004</xref>). The potential of Vis-NIRS coupled with PLSR was examined by <xref ref-type="bibr" rid="B29">Kooistra et al. (2001)</xref>, who reported a <ext-link ext-link-type="uri" xlink:href="http://www.r-tutor.com/elementary-statistics/simple-linear-regression/coefficient-determination">coefficient of determination</ext-link> (R<sup>2</sup>) of 0.88 and 0.90 for estimating Cd and Zn, respectively, in river floodplains (Netherlands). The PLSR was also used to estimate Cr and Ni concertations in soil samples (<xref ref-type="bibr" rid="B20">Han et al., 2021</xref>), reporting R<sup>2</sup> of 0.69&#x2013;0.71. However, removing uninformative variables improves PLS calibration performance (<xref ref-type="bibr" rid="B45">Spiegelman et al., 1998</xref>; <xref ref-type="bibr" rid="B3">Andries et al., 2011</xref>, <xref ref-type="bibr" rid="B4">2017</xref>). Besides better PLS model interpretation, lower measurement costs and a lower risk of overfitting may be obtained (<xref ref-type="bibr" rid="B2">Andersen and Bro, 2010</xref>).</p>
<p>Variable selection algorithms are well-known for improving model robustness and precision, excluding noisy spectral regions and collinear wavelengths (<xref ref-type="bibr" rid="B54">Xiaobo et al., 2010</xref>). For PLS, many variable elimination methods have been published (<xref ref-type="bibr" rid="B14">Gauchi and Chagnon, 2001</xref>; <xref ref-type="bibr" rid="B54">Xiaobo et al., 2010</xref>; <xref ref-type="bibr" rid="B60">Huang et al., 2019</xref>; <xref ref-type="bibr" rid="B61">Mehmood et al., 2020</xref>), among which are the uninformative variable elimination (UVE) for PLSR (UVE-PLS) (<xref ref-type="bibr" rid="B8">Centner et al., 1996</xref>) and simulated annealing (SA) (<xref ref-type="bibr" rid="B22">Kalivas et al., 1989</xref>). UVE-PLS is a variable elimination method based on the PLSR regression coefficients&#x2019; significance. Variable importance is determined by PLSR regression coefficients and the standard deviation is calculated based on cross-validation (e.g., jackknifing). The variables with values less than the calculated threshold from the random process within the cross-validation are removed. SA has shown promising results in improving PLSR calibrations in various matrices (<xref ref-type="bibr" rid="B6">Balabin and Smirnov, 2011</xref>; <xref ref-type="bibr" rid="B31">Liu et al., 2019</xref>; <xref ref-type="bibr" rid="B18">Guo et al., 2020</xref>). The SA is a probabilistic optimization technique that accepts non-optimizing solutions with a predetermined probability of avoiding being trapped in a local minimum (<xref ref-type="bibr" rid="B46">Swierenga et al., 1998</xref>).</p>
<p>Industrial activities and long-term applications of inorganic fertilizers have heavily impacted agricultural soils in several regions of Egypt and other countries over the last few decades. Furthermore, the high-cost laboratory analysis of PTEs for large samples compared with the proximal sensing method (<xref ref-type="bibr" rid="B35">Nawar et al., 2020</xref>). Therefore, there is a growing need for versatile and cost-effective methods that can be developed based on limited reference samples for rapidly quantifying soil contaminants by PTEs. This study aimed to investigate the feasibility and cost-effectiveness of Vis&#x2013;NIRS to quantify key PTEs (e.g., Cd, Co, Cu, Cr, Pb, and Zn) in limited samples from arid agricultural soils of a polluted area close to the Nile River in Egypt. The main objectives were: (i) to explore the potential of vis&#x2013;NIRS for predicting the key PTEs and (ii) to compare the performance of spectral models using the PLSR method with spectral full-range (FR-PLS) and selected spectral datasets based on uninformative variable elimination (UVE-PLS) and the simulated annealing (SA-PLS), for models calibration and predictions of the target key PTEs.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>2 Materials and methods</title>
<sec id="s2-1">
<title>2.1 Study area</title>
<p>The study area is located along with both sides El-Moheet drainage, Minya Governorate, Upper Egypt (<xref ref-type="fig" rid="F1">Figure 1</xref>). This drainage extends south to north of serving the Governorate, with a length of about 100&#xa0;km. However, it is considered the most dangerous source of pollution to the environment in this area. The study area occupied about 28,94&#xa0;km<sup>2</sup> (27&#xb0; 56&#x2032;30&#x2033;to 28&#xb0; 04&#x2032;35&#x2033;N, and 30&#xb0; 43&#x2032;09&#x2033;to 30&#xb0; 48&#x2032;51&#x2033;E). The area is almost flat, with elevations between 38 and 41&#xa0;m above sea level. Arid conditions characterize the study area, including a hot summer, a warm winter, high evaporation, and low rainfall intensity. The average annual temperature during the winter months is about 29&#xb0;C, while it reaches 41&#xb0;C in the summer (<xref ref-type="bibr" rid="B33">Mayhoub and Azzam, 1997</xref>). The soil of the study area is located among the alluvial floodplain deposits of the Nile River, with dominant texture ranges between silt and clay. Based on the soil taxonomy (<xref ref-type="bibr" rid="B59">Soil Survey Staff, 2022</xref>), the soils were classified to the suborder level as <italic>Entic Calcitorrerts</italic>, <italic>Typic Haplotorrerts</italic>, and <italic>Haplotorrrerts</italic>. The study area is mainly cultivated with wheat, corn, soybeans, cotton, potatoes, and sugar cane (<xref ref-type="bibr" rid="B19">Hammam et al., 2022</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Location map of the study area and the soil samples.</p>
</caption>
<graphic xlink:href="fenvs-11-1222871-g001.tif"/>
</fig>
</sec>
<sec id="s2-2">
<title>2.2 Soil analyses and spectral measurement</title>
<p>Eighty soil samples were collected (60&#xa0;at 0&#x2013;20&#xa0;cm and 20&#xa0;at 20&#x2013;40&#xa0;cm) to create the soil spectral library. Sixty sampling locations were selected randomly to cover the soil spatial variability regarding land use, texture, and slope variation within the study area. For the surface sampling (0&#x2013;20&#xa0;cm), around 1&#xa0;kg of soil was taken at each location, and the sampling positions were recorded using GPS (<xref ref-type="bibr" rid="B19">Hammam et al., 2022</xref>). To introduce the PTEs variability with depth to the spectral library, additional twenty subsurface samples (20&#x2013;40&#xa0;cm) were randomly selected at 20 locations out of the sixty locations. The limited subsurface samples were due to budget limitations. The samples were prepared by manually removing the non-soil materials (e.g., grass, roots, stone/gravel). Each soil sample was thoroughly mixed and quartered, bringing the total weight down to about 300&#xa0;g, and is air-derided before being ground and sieved (2&#xa0;mm) to obtain the fine earth (<xref ref-type="bibr" rid="B30">Liu et al., 2020</xref>; <xref ref-type="bibr" rid="B15">Gholizadeh et al., 2021</xref>). Finally, each sample was divided into two parts of about 150&#xa0;g each for chemical and spectral analyses.</p>
<sec id="s2-2-1">
<title>2.2.1 Soil chemical analyses</title>
<p>Each sample was first transferred to the National Authority for Remote Sensing and Space Sciences (NARSS), where the chemical analyses were performed. The soil organic carbon (SOC) content was determined by Walkley and Black procedure (<xref ref-type="bibr" rid="B50">Walkley and Black, 1934</xref>). For the extraction and quantification of total PTEs, the aqua regia digestion method was used (<xref ref-type="bibr" rid="B40">Page et al., 1982</xref>). Briefly, 0.25&#xa0;g of soil was extracted with a mixture of concentrated nitric and hydrochloric acids (7&#xa0;mL and 2&#xa0;mL, respectively) using the microwave instrument at 200&#xb0;C. The extraction was then made up to 50&#xa0;mL volume by adding water. The PTEs analysis was performed by ICP-MS (Thermo, model iCAP-RQ). Using 1:2.5 soil water suspension, the soil pH was measured by the pH-meter Jenway (<xref ref-type="bibr" rid="B19">Hammam et al., 2022</xref>).</p>
</sec>
<sec id="s2-2-2">
<title>2.2.2 Spectra collection</title>
<p>The second part of each sample was thoroughly mixed and placed in plastic cups with diameters of 4.9 and 2&#xa0;cm in height. The sample surface was leveled and smoothed with a spatula to achieve optimal diffuse reflection. The soil spectra were measured in reflectance format using an ASD FieldSpec 4 spectroradiometer (Malvern Panalytical Inc., Westborough, USA) with a full range (350&#x2013;2,500&#xa0;nm). The spectral resolution varies from 3&#xa0;nm in the 700&#xa0;nm range to 6&#xa0;nm in the 1,400&#x2013;2,100&#xa0;nm range. The samples were scanned by a high-intensity probe with a light source (built-in) that was used in contact with complete darkness conditions. Before sample scanning, the ASD instrument was started and allowed to warm up for 30&#xa0;min and then calibrated with a white reference (99% reflection). Five successive spectra were taken and averaged to produce one representative spectrum of each soil sample.</p>
</sec>
<sec id="s2-2-3">
<title>2.2.3 Spectral data preprocessing</title>
<p>The same spectral data preprocessing was performed for all PTEs investigated using Python. First, the noise at both edges was removed by cutting the range outside 450&#x2013;2,450&#xa0;nm. Then, spectra were subjected to a second derivative with a Savitzky&#x2013;Golay smoothing (SDSG) technique (<xref ref-type="bibr" rid="B42">Savitzky and Golay, 1964</xref>). The SDSG was calculated using a second-order polynomial, which fit 13-point-width spectral windows. The derivatives methods can eliminate the spectra&#x2019;s baseline drift, enhance absorption features, and extract relevant information from the near-infrared range (<xref ref-type="bibr" rid="B12">Ertlen et al., 2010</xref>). The derivatives of spectral data (first and second) have been used to improve the prediction of PTEs, e.g., Cd, Cu, Pb, and Zn (<xref ref-type="bibr" rid="B26">Khosravi et al., 2018</xref>; <xref ref-type="bibr" rid="B32">Liu et al., 2018</xref>).</p>
</sec>
</sec>
<sec id="s2-3">
<title>2.3 Statistical analysis</title>
<sec id="s2-3-1">
<title>2.3.1 Model based on full spectral range and partial least squares regression (FR-PLS)</title>
<p>PLSR is a multivariate analysis technique that projects the X variables (predictors) and the Y variable (response), to a new space to model the linear relationship (<xref ref-type="bibr" rid="B51">Wold et al., 2001</xref>). The algorithm projects information in the original X data onto a small number of essential orthogonal variables (components).</p>
<p>To develop the FR-PLS models, a two-dimensional data matrix comprised of the Xi variables (full spectral data (450&#x2013;2,450&#xa0;nm)) and Yi variables (PTEs values) was created. Before running the analysis, the entire dataset was divided into 75% for calibration and 25% for prediction using the Kennard-Stone (KS) algorithm (<xref ref-type="bibr" rid="B24">Kennard and Stone, 1969</xref>). PLSR with k-fold cross-validation (k &#x3d; 5) correlated the variation in a target variable (e.g., PTEs) to the variation in multi-component variables (wavelengths) by using the sklearn. decomposition module available in Python. The optimal number of components (NC) (latent variables) was determined based on the NC with the smallest root mean squared error of cross-validation (RMSEcv). The best performance calibration model (lowest RMSEcv) was tested using the validation (prediction) set.</p>
</sec>
<sec id="s2-3-2">
<title>2.3.2 Models based on features selection algorithms and PLSR</title>
<p>Removing unrelated variables, omitting redundancies, and selecting the most relevant variables from spectral data are necessary to improve model accuracy (<xref ref-type="bibr" rid="B55">Xu et al., 2019</xref>). The feature selection methods reduce complexity while retaining the most valuable wavelengths highly correlated with the predicted variables (<xref ref-type="bibr" rid="B54">Xiaobo et al., 2010</xref>). In the current study, two algorithms, uninformative variable elimination (UVE) (<xref ref-type="bibr" rid="B8">Centner et al., 1996</xref>) and simulated annealing (SA) (<xref ref-type="bibr" rid="B27">Kirkpatrick et al., 1983</xref>), were used to choose the essential spectral features for PTE assessment. These methods were used to develop spectral models and compared with those based on full-range spectral data (FR-PLS) developed in section 2.3.1.</p>
<sec id="s2-3-2-1">
<title>2.3.2.1 Models based on simulated annealing (SA) and PLSR (SA-PLS)</title>
<p>SA is a stochastic global search optimization algorithm. Variable selection by SA improves the model&#x2019;s transferability and predictive accuracy (<xref ref-type="bibr" rid="B46">Swierenga et al., 1998</xref>). For wavelength selection, the SA solution is denoted as a string of numbers containing k values representing the variables to be selected from N variables from the calibration set (X). The X variables combined with PTEs values (Y) were used to develop a PLSR model with predetermined components (<xref ref-type="bibr" rid="B54">Xiaobo et al., 2010</xref>). SA typically defines and attempts to reduce a cost function, namely, the root mean square error in cross-validation (RMSE<sub>CV</sub>). The goal is to define a hyper-parameter&#x2014;the number of bands that must be retained (N)&#x2014;that is less than the total number of bands during the optimisation process. The procedure includes fitting a PLSR model with the optimal number of latent variables and calculating the RMSE<sub>CV</sub> (cost function) iteratively. At each step, three bands were randomly swapped, and the RMSE<sub>CV</sub> of the optimised PLSR was calculated. The selected bands are returned at the end of the procedure, along with the optimal number of PLSR model components associated with such a band selection and the value of the RMSE<sub>CV</sub> at each iteration.</p>
</sec>
<sec id="s2-3-2-2">
<title>2.3.2.2 Models based on uninformative variable elimination (UVE) and PLSR (UVE-PLS)</title>
<p>The UVE technique selects variables with the highest correlation with the response, observing only the properties inherent in the spectral data. The variable selection-based VE method uses the PLSR algorithm output to identify only a subset of important variables for variable identification. Variables are chosen in two stages when using a filter. First, the PLSR model is developed based on the given data, and then the variables are selected by introducing a threshold based on the results of the developed model. The feature&#x2019;s relevance score is then calculated individually, excluding feature interactions. The UVE-PLS method was developed in the following steps: (1) optimise the PLSR using the entire spectrum, (2) extract the regression coefficients that associate each wavelength with the response, and (3) discard the lowest correlation wavelengths one at a time, (4) rebuild the calibration model using the lowest RMSE of cross-validation as the metric in iteration until the RMSE decreases, and (5) remove a fixed number of wavelengths iteratively until the RMSEcv decreases.</p>
</sec>
</sec>
<sec id="s2-3-3">
<title>2.3.3 Models accuracy assessment</title>
<p>The performance of the spectral models in predicting the PTEs was assessed based on the calculated values of the coefficient of determination (R<sup>2</sup>), RMSE, and the ratio of performance to deviation (RPD) described as follows:<disp-formula id="e1">
<mml:math id="m1">
<mml:mrow>
<mml:msup>
<mml:mi>R</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>i</mml:mi>
<mml:mi>n</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>i</mml:mi>
<mml:mi>n</mml:mi>
</mml:munderover>
</mml:mstyle>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>x</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>
<disp-formula id="e2">
<mml:math id="m2">
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>i</mml:mi>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>
<disp-formula id="e3">
<mml:math id="m3">
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>P</mml:mi>
<mml:mi>D</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>d</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(3)</label>
</disp-formula>
</p>
<p>Where the measured <inline-formula id="inf1">
<mml:math id="m4">
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</inline-formula> and predicted <inline-formula id="inf2">
<mml:math id="m5">
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</inline-formula> are the values for sample i; <inline-formula id="inf3">
<mml:math id="m6">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>x</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf4">
<mml:math id="m7">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> are the mean of the observed and predicted values, respectively. The std is the standard deviation of the samples. Six performance classes were adopted according to the suggested classes by <xref ref-type="bibr" rid="B48">Viscarra Rossel et al. (2006)</xref>: very poor model (RPD &#x3c;1.0), poor (RPD &#x3d; 1.0&#x2013;1.4), fair (RPD &#x3d; 1.4&#x2013;1.8), good (RPD &#x3d; 1.8&#x2013;2.0), very good (RPD &#x3d; 2.0&#x2013;2.5), and excellent (RPD &#x3e;2.5).</p>
</sec>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>3 Results</title>
<sec id="s3-1">
<title>3.1 Soil and spectral data</title>
<p>
<xref ref-type="table" rid="T1">Table 1</xref> presents the statistics of pH, SOC, and the tested elements. The soil pH values ranged between 7.79 and 8.56 with a mean value of 8.15. The SOC content ranged between 2,460&#xa0;mg kg<sup>-1</sup> and 25710&#xa0;mg kg<sup>-1</sup> with a mean value of 10948&#xa0;mg kg<sup>-1</sup>. The contents of Cd have the lowest content, ranging between 0.05 and 2.07&#xa0;mg kg<sup>-1,</sup> with mean and SD of 0.79 and 0.46&#xa0;mg kg<sup>-1</sup>, respectively. The values of Fe, Zn, and Cr followed the highest contents with mean values of 137.55, 83.11, and 79.52&#xa0;mg kg<sup>-1</sup>, maximum values of 210.43, 131.13, and 127.16&#xa0;mg kg<sup>-1</sup>, and SD of 21.43, 12.67, and 18.57&#xa0;mg kg<sup>-1</sup>, respectively. The contents of Pb and Co are comparable with mean values of 30.04 and 28.54&#xa0;mg kg<sup>-1</sup> and maximum values of 106.54 and 43.52&#xa0;mg kg<sup>-1</sup>, respectively. The contents of Cu ranged between 34.25 and 91.40&#xa0;mg kg<sup>-1,</sup> with a mean value of 50.22&#xa0;mg kg<sup>-1</sup>.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Descriptive statistics of the soil samples (80) analysed for pH, soil organic carbon (SOC), iron (Fe), cadmium (Cd), copper (Cu), cobalt (Co), chromium (Cr), lead (Pb), and zinc (Zn) analysed with inductively coupled plasma mass spectrometry (ICP-MS) for the total contents (mg kg<sup>-1</sup>).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left"/>
<th align="center">pH</th>
<th align="center">SOC</th>
<th align="center">Fe</th>
<th align="center">Cd</th>
<th align="center">Cu</th>
<th align="center">Co</th>
<th align="center">Cr</th>
<th align="center">Pb</th>
<th align="center">Zn</th>
</tr>
<tr>
<th colspan="10" align="center">mg kg-1</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">
<bold>No.</bold>
</td>
<td align="right">80</td>
<td align="right">80</td>
<td align="right">80</td>
<td align="right">80</td>
<td align="right">80</td>
<td align="right">76</td>
<td align="right">76</td>
<td align="right">78</td>
<td align="right">76</td>
</tr>
<tr>
<td align="left">
<bold>min</bold>
</td>
<td align="right">7.79</td>
<td align="right">2,460</td>
<td align="right">85.82</td>
<td align="right">0.05</td>
<td align="right">34.25</td>
<td align="right">20.61</td>
<td align="right">53.09</td>
<td align="right">13.52</td>
<td align="right">61.71</td>
</tr>
<tr>
<td align="left">
<bold>Q1</bold>
</td>
<td align="right">8.07</td>
<td align="right">7,565</td>
<td align="right">121.78</td>
<td align="right">0.52</td>
<td align="right">44.64</td>
<td align="right">24.17</td>
<td align="right">66.97</td>
<td align="right">20.75</td>
<td align="right">74.12</td>
</tr>
<tr>
<td align="left">
<bold>Med</bold>
</td>
<td align="right">8.16</td>
<td align="right">11080</td>
<td align="right">137.23</td>
<td align="right">0.64</td>
<td align="right">48.43</td>
<td align="right">27.27</td>
<td align="right">74.14</td>
<td align="right">24.67</td>
<td align="right">81.36</td>
</tr>
<tr>
<td align="left">
<bold>Q3</bold>
</td>
<td align="right">8.26</td>
<td align="right">14005</td>
<td align="right">150.41</td>
<td align="right">1.07</td>
<td align="right">52.53</td>
<td align="right">32.78</td>
<td align="right">90.09</td>
<td align="right">32.26</td>
<td align="right">88.98</td>
</tr>
<tr>
<td align="left">
<bold>max</bold>
</td>
<td align="right">8.56</td>
<td align="right">25710</td>
<td align="right">210.43</td>
<td align="right">2.07</td>
<td align="right">91.40</td>
<td align="right">43.52</td>
<td align="right">127.16</td>
<td align="right">106.54</td>
<td align="right">131.13</td>
</tr>
<tr>
<td align="left">
<bold>mean</bold>
</td>
<td align="right">8.15</td>
<td align="right">10984</td>
<td align="right">137.55</td>
<td align="right">0.79</td>
<td align="right">50.22</td>
<td align="right">28.54</td>
<td align="right">79.52</td>
<td align="right">30.04</td>
<td align="right">83.11</td>
</tr>
<tr>
<td align="left">
<bold>SD</bold>
</td>
<td align="right">0.15</td>
<td align="right">4,753</td>
<td align="right">21.43</td>
<td align="right">0.46</td>
<td align="right">10.53</td>
<td align="right">5.54</td>
<td align="right">18.57</td>
<td align="right">16.50</td>
<td align="right">12.67</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Note: SD, standard deviation, Q1 &#x3d; first quartile, Q3 &#x3d; third quartile.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>
<xref ref-type="fig" rid="F2">Figure 2</xref> presents the calculated Pearson correlation coefficients (r) between pH, SOC content, and PTEs concentrations. A positive correlation was observed between the tested PTEs, except a negative correlation between Co and Fe. The highest coefficient value was observed between Cr and Cd (r &#x3d; 0.82). The high correlations were observed between Cr and the other PTEs with r values of 0.60 with Cu, 0.53 with Pb, and 0.43 with Zn, but a very low correlation with Co (r &#x3d; 0.23). The correlation between Cr and Fe was high (r &#x3d; 0.63). SOC demonstrated a low correlation with Cu, Co, and Zn, very low with Cd, Cr, and Pb, and negative with Fe (r &#x3d; - 0.11). The pH showed moderate negative correlations with Cd, Cr, Zn, Pb, and Cu (&#x2212;0.33 &#x2264; r &#x2264; &#x2212;0.49), but showed the negative weak correlations with Co and Fe (r &#x3d; &#x2212;0.21 and &#x2212;0.18). Also, a medium negative correlation was found between pH and SOC (r &#x3d; &#x2212;0.36).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>The correlation coefficients (Pearson) between the measured PTEs, e.g., chromium (Cr), cobalt (Co), cadmium (Cd), zinc (Zn), copper (Cu), iron (Fe), and lead (Pb), soil organic carbon (SOC), and pH.</p>
</caption>
<graphic xlink:href="fenvs-11-1222871-g002.tif"/>
</fig>
</sec>
<sec id="s3-2">
<title>3.2 Soil spectra</title>
<p>The raw and processed spectral data of the soil samples are presented in <xref ref-type="fig" rid="F3">Figure 3</xref>. The main features at 450&#x2013;550&#xa0;nm, 900&#xa0;nm, 1,400&#xa0;nm, 1900&#xa0;nm, and 2,200&#xa0;nm are observed (<xref ref-type="fig" rid="F3">Figure 3A</xref>), but the absorption characteristics were not significant enough. The second derivative spectra indicated that the baseline drift and mixed overlapping peaks were gradually eliminated, thereby more detailed information and characteristic peaks appeared (<xref ref-type="fig" rid="F3">Figure 3B</xref>). The second derivative spectra showed six regions of the spectrum that exhibit distinct absorption features around 480&#x2013;550&#xa0;nm, 1,400&#xa0;nm, 1900&#xa0;nm, 2,200&#xa0;nm, 2,300, and 2,400&#xa0;nm. The absorption features in the visible region are typically broad, while the features in the infrared region (e.g., 2,200 or 2,300&#xa0;nm) are usually narrower and sharper. The absorption features around 1,400 and 1900&#xa0;nm are associated with hydroxyl (OH) and water. The region between 2000 and 2,400&#xa0;nm is associated with the components of organic matter.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>The raw spectra <bold>(A)</bold> and the processed spectra using the second derivative <bold>(B)</bold>.</p>
</caption>
<graphic xlink:href="fenvs-11-1222871-g003.tif"/>
</fig>
</sec>
<sec id="s3-3">
<title>3.3 Performance of PLSR-based full spectral range (FR-PLS) models</title>
<p>The results of estimating PTEs based on the FR-PLS models in cross-validation and prediction are presented in <xref ref-type="table" rid="T2">Table 2</xref>. The performance of the models in cross-validation was poor to fair (1.07 &#x2264; RPD &#x2264;1.47). <xref ref-type="table" rid="T2">Table 2</xref> shows that the best results were obtained for the Cr (R<sup>2</sup> &#x3d; 0.54, RMSEcv &#x3d; 13.40&#xa0;mg kg<sup>-1</sup>, and RPD &#x3d; 1.47), followed by Zn, Pb, Co, and Cu, respectively. The worst results were obtained for Cd (R<sup>2</sup> &#x3d; 0.13, RMSEcv &#x3d; 0.40&#xa0;mg kg<sup>-1</sup>, and RPD &#x3d; 1.07).</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>The cross-validation and prediction (validation) results of PLSR models based on: a full range (FR-PLS), simulated annealing (SA-PLS), and uninformative variable elimination (UVE-PLS) of Vis-NIR spectral data for estimating cadmium (Cd), copper (Cu), cobalt (Co), chromium (Cr), lead (Pb), and zinc (Zn).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left"/>
<th align="left"/>
<th align="left"/>
<th align="left"/>
<th colspan="3" align="center">Cross-validation</th>
<th colspan="3" align="center">Validation</th>
</tr>
<tr>
<th align="left"/>
<th align="center">Data set</th>
<th align="left"/>
<th align="left"/>
<th align="center">R<sup>2</sup>
</th>
<th align="center">RMSEcv</th>
<th align="center">RPD</th>
<th align="center">R<sup>2</sup>
</th>
<th align="center">RMSEP</th>
<th align="center">RPD</th>
</tr>
<tr>
<th align="left"/>
<th align="left"/>
<th align="center">NC</th>
<th align="center">NV</th>
<th align="left"/>
<th align="center">(mg kg<sup>-1</sup>)</th>
<th align="left"/>
<th align="left"/>
<th align="center">(mg kg<sup>-1</sup>)</th>
<th align="left"/>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">
<bold>Cd</bold>
</td>
<td align="center">FR-PLS</td>
<td align="center">2</td>
<td align="center">2,150</td>
<td align="center">0.13</td>
<td align="center">0.40</td>
<td align="center">1.07</td>
<td align="center">0.12</td>
<td align="center">0.45</td>
<td align="center">1.00</td>
</tr>
<tr>
<td align="left"/>
<td align="center">SA-PLS</td>
<td align="center">8</td>
<td align="center">200</td>
<td align="center">0.58</td>
<td align="center">0.31</td>
<td align="center">1.55</td>
<td align="center">0.47</td>
<td align="center">0.27</td>
<td align="center">1.52</td>
</tr>
<tr>
<td align="left"/>
<td align="center">UVE-PLS</td>
<td align="center">6</td>
<td align="center">252</td>
<td align="center">0.73</td>
<td align="center">0.23</td>
<td align="center">1.92</td>
<td align="center">0.62</td>
<td align="center">0.24</td>
<td align="center">1.86</td>
</tr>
<tr>
<td align="center">
<bold>Cu</bold>
</td>
<td align="center">FR-PLS</td>
<td align="center">4</td>
<td align="center">2,150</td>
<td align="center">0.20</td>
<td align="center">9.40</td>
<td align="center">1.11</td>
<td align="center">0.19</td>
<td align="center">9.29</td>
<td align="center">1.05</td>
</tr>
<tr>
<td align="left"/>
<td align="center">SA-PLS</td>
<td align="center">9</td>
<td align="center">200</td>
<td align="center">0.59</td>
<td align="center">6.77</td>
<td align="center">1.60</td>
<td align="center">0.53</td>
<td align="center">5.75</td>
<td align="center">1.61</td>
</tr>
<tr>
<td align="left"/>
<td align="center">UVE-PLS</td>
<td align="center">5</td>
<td align="center">239</td>
<td align="center">0.72</td>
<td align="center">6.08</td>
<td align="center">1.88</td>
<td align="center">0.59</td>
<td align="center">3.83</td>
<td align="center">1.78</td>
</tr>
<tr>
<td align="center">
<bold>Co</bold>
</td>
<td align="center">FR-PLS</td>
<td align="center">3</td>
<td align="center">2,150</td>
<td align="center">0.30</td>
<td align="center">5.57</td>
<td align="center">1.08</td>
<td align="center">0.15</td>
<td align="center">4.28</td>
<td align="center">1.02</td>
</tr>
<tr>
<td align="left"/>
<td align="center">SA-PLS</td>
<td align="center">9</td>
<td align="center">200</td>
<td align="center">0.57</td>
<td align="center">3.63</td>
<td align="center">1.53</td>
<td align="center">0.46</td>
<td align="center">3.26</td>
<td align="center">1.47</td>
</tr>
<tr>
<td align="left"/>
<td align="center">UVE-PLS</td>
<td align="center">9</td>
<td align="center">370</td>
<td align="center">0.69</td>
<td align="center">3.13</td>
<td align="center">1.80</td>
<td align="center">0.52</td>
<td align="center">2.49</td>
<td align="center">1.68</td>
</tr>
<tr>
<td align="center">
<bold>Cr</bold>
</td>
<td align="center">FR-PLS</td>
<td align="center">3</td>
<td align="center">2,150</td>
<td align="center">0.54</td>
<td align="center">13.40</td>
<td align="center">1.47</td>
<td align="center">0.39</td>
<td align="center">28.97</td>
<td align="center">1.10</td>
</tr>
<tr>
<td align="left"/>
<td align="center">SA-PLS</td>
<td align="center">10</td>
<td align="center">200</td>
<td align="center">0.62</td>
<td align="center">13.13</td>
<td align="center">1.65</td>
<td align="center">0.56</td>
<td align="center">18.79</td>
<td align="center">1.62</td>
</tr>
<tr>
<td align="left"/>
<td align="center">UVE-PLS</td>
<td align="center">17</td>
<td align="center">118</td>
<td align="center">0.76</td>
<td align="center">8.71</td>
<td align="center">2.03</td>
<td align="center">0.74</td>
<td align="center">8.29</td>
<td align="center">2.48</td>
</tr>
<tr>
<td align="center">
<bold>Pb</bold>
</td>
<td align="center">FR-PLS</td>
<td align="center">10</td>
<td align="center">2,150</td>
<td align="center">0.40</td>
<td align="center">18.83</td>
<td align="center">1.39</td>
<td align="center">0.14</td>
<td align="center">25.87</td>
<td align="center">1.02</td>
</tr>
<tr>
<td align="left"/>
<td align="center">SA-PLS</td>
<td align="center">9</td>
<td align="center">200</td>
<td align="center">0.42</td>
<td align="center">13.21</td>
<td align="center">1.41</td>
<td align="center">0.31</td>
<td align="center">9.57</td>
<td align="center">1.30</td>
</tr>
<tr>
<td align="left"/>
<td align="center">UVE-PLS</td>
<td align="center">10</td>
<td align="center">120</td>
<td align="center">0.75</td>
<td align="center">8.28</td>
<td align="center">2.00</td>
<td align="center">0.72</td>
<td align="center">7.79</td>
<td align="center">2.03</td>
</tr>
<tr>
<td align="center">
<bold>Zn</bold>
</td>
<td align="center">FR-PLS</td>
<td align="center">4</td>
<td align="center">2,150</td>
<td align="center">0.48</td>
<td align="center">21.736</td>
<td align="center">1.39</td>
<td align="center">0.14</td>
<td align="center">27.86</td>
<td align="center">1.01</td>
</tr>
<tr>
<td align="left"/>
<td align="center">SA-PLS</td>
<td align="center">10</td>
<td align="center">200</td>
<td align="center">0.60</td>
<td align="center">21.33</td>
<td align="center">1.57</td>
<td align="center">0.40</td>
<td align="center">7.89</td>
<td align="center">1.35</td>
</tr>
<tr>
<td align="left"/>
<td align="center">UVE-PLS</td>
<td align="center">6</td>
<td align="center">219</td>
<td align="center">0.67</td>
<td align="center">7.54</td>
<td align="center">1.75</td>
<td align="center">0.46</td>
<td align="center">5.85</td>
<td align="center">1.41</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Note: RPD, ratio of performance to deviation; NC, the number of components; NV, number of variables.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>The prediction results were less than the cross-validation with very poor performance (1.00 &#x2264; RPD &#x2264;1.10). The best results were obtained for Cr (R<sup>2</sup> &#x3d; 0.39, RMSEP &#x3d; 28.97&#xa0;mg kg<sup>-1</sup>, and RPD &#x3d; 1.10), followed by Cu, Co, Pb, and Zn, respectively (<xref ref-type="table" rid="T2">Table 2</xref>). The worst results were obtained for Cd (R<sup>2</sup> &#x3d; 0.12, RMSEP &#x3d; 0.45&#xa0;mg kg<sup>-1</sup>, and RPD &#x3d; 1.00).</p>
</sec>
<sec id="s3-4">
<title>3.4 Performance of PLSR-based simulated annealing (SA-PLS) models</title>
<p>The results of SA-PLS models in cross-validation and prediction are presented in <xref ref-type="table" rid="T2">Table 2</xref>. The performance of SA-PLS models in cross-validation and prediction was better than those of FR-PLS models. The SA-PLS models&#x2019; performance in cross-validation was fair (1.41 &#x2264; RPD &#x2264;1.65). The best results were obtained for the Cr (R<sup>2</sup> &#x3d; 0.62, RMSEcv &#x3d; 13.13&#xa0;mg kg<sup>-1</sup>, and RPD &#x3d; 1.65) followed by Zn, Cu, Cd, and Co, respectively (<xref ref-type="table" rid="T2">Table 2</xref>). The worst results were obtained for Pb (R<sup>2</sup> &#x3d; 0.42, RMSEcv &#x3d; 13.21&#xa0;mg kg<sup>-1</sup>, and RPD &#x3d; 1.41) (<xref ref-type="table" rid="T2">Table 2</xref>). The prediction results followed the trend of cross-validation with fair to poor performance (1.30 &#x2264; RPD &#x2264;1.62). The best results were obtained for Cr (R<sup>2</sup> &#x3d; 0.56, RMSEP &#x3d; 18.79&#xa0;mg&#xa0;kg<sup>-1</sup>, and RPD &#x3d; 1.62), followed by Cu, Cd, Co, and Zn, respectively (<xref ref-type="table" rid="T2">Table 2</xref>). The worst prediction results were obtained for Pb (R<sup>2</sup> &#x3d; 0.31, RMSEP &#x3d; 9.57&#xa0;mg kg<sup>-1</sup>, and RPD &#x3d; 1.30).</p>
</sec>
<sec id="s3-5">
<title>3.5 Performance of PLSR-based uninformative variable elimination (UVE-PLS) models</title>
<p>In all cases, the UVE-PLS outperformed the SA-PLS and FR-PLS models, resulting in a good cross-validation performance and predictions (<xref ref-type="table" rid="T2">Table 2</xref>; <xref ref-type="fig" rid="F4">Figure 4</xref> &#x26;5). The performance of UVE-PLS in cross-validation was fair to very good (1.75 &#x2264; RPD &#x2264;2.03). The highest cross-validation performance was for Cr (R<sup>2</sup> &#x3d; 0.76, RMSEcv &#x3d; 8.71&#xa0;mg kg<sup>-1</sup>, and RPD &#x3d; 2.03), followed by Pb, Cd, Cu, and Co, respectively. The worst performance was obtained for Zn with R<sup>2</sup> &#x3d; 0.67, RMSEcv &#x3d; 7.54&#xa0;mg kg<sup>-1</sup>, and RPD &#x3d; 1.75 (<xref ref-type="table" rid="T2">Table 2</xref>; <xref ref-type="fig" rid="F4">Figure 4</xref>). The prediction results showed the same trend of the cross-validation, with fair to very good performance (1.41 &#x2264; RPD &#x2264;2.48). The best performance was obtained for Cr (R<sup>2</sup> &#x3d; 0.74, RMSEP &#x3d; 8.29&#xa0;mg kg<sup>-1</sup>, and RPD &#x3d; 2.48), followed by Pb, Cd, Cu, and Co. The worst performance was obtained for Zn with R<sup>2</sup> &#x3d; 0.46, RMSEP &#x3d; 5.85&#xa0;mg kg<sup>-1</sup>, and RPD &#x3d; 1.41 (<xref ref-type="table" rid="T2">Table 2</xref>; <xref ref-type="fig" rid="F5">Figure 5</xref>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>The cross-validation results of the UVE-PLS models for the tested PTEs Cd <bold>(A)</bold>, Cu <bold>(B)</bold>, Co <bold>(C)</bold>, Cr <bold>(D)</bold>, Pb <bold>(E)</bold>, and Zn <bold>(F)</bold>.</p>
</caption>
<graphic xlink:href="fenvs-11-1222871-g004.tif"/>
</fig>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>The prediction results of the UVE-PLS models for the tested PTEs Cd <bold>(A)</bold>, Cu <bold>(B)</bold>, Co <bold>(C)</bold>, Cr <bold>(D)</bold>, Pb <bold>(E)</bold>, and Zn <bold>(F)</bold>.</p>
</caption>
<graphic xlink:href="fenvs-11-1222871-g005.tif"/>
</fig>
</sec>
<sec id="s3-6">
<title>3.6 Comparison of the models (FR-PLS, SA-PLS, and UVE-PLS) performance</title>
<p>The spectral models based on PLSR and different spectral datasets provided diverse performances. The UVE-PLS method outperformed the SA-PLS in reducing variables and improving the prediction results. The best prediction results were achieved with UVE-PLS with very good performance for Cr with R<sup>2</sup> &#x3d; 0.74, RMSEP &#x3d; 8.29&#xa0;mg kg<sup>-1</sup>, and RPD &#x3d; 2.48 (<xref ref-type="fig" rid="F6">Figures 6A&#x2013;C</xref>, respectively). The SA-PLS provided a fair prediction for Cr with R<sup>2</sup> &#x3d; 0.56, RMSE of 18.79&#xa0;mg kg<sup>-1</sup>, and RPD of 1.62. Where the performance of Cr prediction based on FR-PLS was very poor R<sup>2</sup> &#x3d; 0.39, RMSE &#x3d; 28.97&#xa0;mg kg<sup>-1</sup>, and RPD &#x3d; 1.10. These results indicated a substantial accuracy improvement in the Cr UVE-PLS model. The improvement in R<sup>2</sup> (increasing by 89.7%), a reduction in RMSE by 71.4%, and an increase in RPD by 125.4%, compared with Cr FR-PLS models. Compared the results of Cr UVE-PLS with the results of Cr SA-PLS, R<sup>2</sup> increased by 32.1%, RMSE reduced by 55.9%, and RPD increased by 53.1%. Similarly, the predictions of the other PTEs (Cd, Co, Cu, Pb, and Zn) based UVE-PLS models were improved as R<sup>2</sup> increased by 67%&#x2013;440% and 11.3%&#x2013;132.2%, RMSE reduced by 32.4%&#x2013;81.3% and 11.1%&#x2013;55.9%, and RPD increased by 56.4%&#x2013;83.0% and 4.4%&#x2013;53.0% compared with the results of Cd, Co, Cu, Pb, and Zn based on FR-PLS and SA-PLS models, respectively.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>The histogram plots of R<sup>2</sup> <bold>(A)</bold>, RMSEP <bold>(B)</bold>, and RPD <bold>(C)</bold> based on values resulted from the spectral models FR-PLS, SA-PLS, and UVE-PLS for the tested PTEs (Cd, Co, Cu, Cr, Pb, and Zn).</p>
</caption>
<graphic xlink:href="fenvs-11-1222871-g006.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>4 Discussion</title>
<p>The PTEs concentrations are characterised by considerable variability as a result of the soil composition, the land use, and the arid nature of the study area. The soils of the study area were classified into three levels: moderate, considerable, and very high levels of contamination. The majority (70.7%) of the study area had high PTEs concentrations, with average concentrations (mg kg<sup>-1</sup>) of Cr, Co, Cu, Cd, Pb, and Zn being 91.23, 29.44, 53.83, 1.12, 36.04, and 101.29, respectively (<xref ref-type="bibr" rid="B19">Hammam et al., 2022</xref>). The positive relationship between PTEs each other and with Fe content (except Co) signifies that PTEs have the same source in the study area. The location of the study area&#x2013;around the El-Moheet drainage&#x2014;on the west side of the Nile River (Egypt), strongly contributed to the soil characteristics and the contamination in the study area. The mineralogical composition of the study area is composed of Holocene silts and clays, due to Nile flooding deposition, which covers the whole area (<xref ref-type="bibr" rid="B58">Abou Heleika et al., 2018</xref>). The low SOC content (1.1%) and pH values that ranged from slightly alkaline (7.79) to moderately alkaline (8.56), can be attributed to the arid nature of the study area (low precipitation) accompanied by the domination of basic cations such as magnesium (Mg<sup>2&#x2b;</sup>) and calcium (Ca<sup>2&#x2b;</sup>) (<xref ref-type="bibr" rid="B1">Al-Soghir et al., 2022</xref>). These findings are in line with those reported that soils in this area of Egypt have low SOC content and high pH (7.73&#x2013;9.45) (e.g., <xref ref-type="bibr" rid="B1">Al-Soghir et al., 2022</xref>; <xref ref-type="bibr" rid="B19">Hammam et al., 2022</xref>). More importantly, the significant impact of the intensive agricultural practices of using mineral fertilizers, pesticides, and polluted irrigation water (<xref ref-type="bibr" rid="B19">Hammam et al., 2022</xref>). The El-Moheet drainage is considered a pollution source as some farmers use such water for irrigating their crops due to the deficiency of clean irrigation water (<xref ref-type="bibr" rid="B58">Abou Heleika et al., 2018</xref>; <xref ref-type="bibr" rid="B19">Hammam et al., 2022</xref>).</p>
<p>The estimation of PTEs using Vis-NIRS mainly relies on the indirect relationship with active soil components (e.g., clay, OC, and Fe). PTEs have no direct spectral features in the Vis-NIR region. Still, they can be detected indirectly through correlation with spectrally active soil attributes such as clay, OC, and Fe in the Vis-NIR region (<xref ref-type="bibr" rid="B10">Cipullo et al., 2019</xref>; <xref ref-type="bibr" rid="B35">Nawar et al., 2020</xref>). The correlation with total Fe can be the major predictive mechanism (<xref ref-type="bibr" rid="B53">Wu et al., 2005</xref>). Thus, the reflectance spectra can indirectly assess the PTEs concentrations in soil samples based on the correlation between contaminant concentrations and spectrally active soil attributes. For example, a considerable positive correlation of Fe with the tested PTEs concentrations (e.g., Cd, Cu, Zn, As, Pb, and Mn) has been reported (<xref ref-type="bibr" rid="B15">Gholizadeh et al., 2021</xref>), suggesting that PTEs were closely bonded to Fe (<xref ref-type="bibr" rid="B53">Wu et al., 2005</xref>). In the current study, the spectrally active soil component (Fe) strongly correlated with the PTEs (Cd, Cu, Pb, Zn, and Cr) with a medium to strong correlation (<italic>r</italic> &#x3d; 0.24&#x2013;0.63). The correlation between the SOC and PTEs was weak to medium positive (<italic>r</italic> &#x3d; 0.09&#x2013;0.42). These results indicate that Fe more significantly influenced the prediction of PTEs contents from spectra than other soil components such as SOC (<xref ref-type="bibr" rid="B26">Khosravi et al., 2018</xref>; <xref ref-type="bibr" rid="B15">Gholizadeh et al., 2021</xref>). Therefore, in arid conditions (low SOC) as the case of current research, the role of Fe in estimating PTEs can be larger than the SOC and can significantly influence soil spectra (<xref ref-type="bibr" rid="B52">Wu et al., 2007</xref>).</p>
<p>Estimating soil PTEs using Vis&#x2013;NIRS was reported with different modelling accuracy (<xref ref-type="bibr" rid="B53">Wu et al., 2005</xref>, <xref ref-type="bibr" rid="B52">2007</xref>; <xref ref-type="bibr" rid="B10">Cipullo et al., 2019</xref>; <xref ref-type="bibr" rid="B21">Hong et al., 2019</xref>; <xref ref-type="bibr" rid="B17">Gholizadeh et al., 2020</xref>). The strong correlations between PTEs and Fe&#x2013;have a spectral response, and are responsible for the viability of the Vis&#x2013;NIRS estimation of PTEs in soils (<xref ref-type="bibr" rid="B23">Kemper and Sommer, 2002</xref>; <xref ref-type="bibr" rid="B5">Ara&#xfa;jo et al., 2014</xref>; <xref ref-type="bibr" rid="B15">Gholizadeh et al., 2021</xref>). Wu et al. (2007) successfully predicted low levels of PTEs in agricultural soils with descending order of prediction accuracy Ni &#x3e; Cr &#x3e; Co &#x3e; Cd. They attributed such order of accuracy to the order of their correlation coefficients with Fe. The high performance of Cr and Pb predictions has been confirmed based on 2,160 samples used to assess selected PTEs (Cr, Cu, Pb, Zn, and Al) in forest soils in the Czech Republic (<xref ref-type="bibr" rid="B15">Gholizadeh et al., 2021</xref>). The current study found different modeling performances for the PTEs models (<xref ref-type="table" rid="T2">Table 2</xref>), with the order Cr &#x3e; Pb &#x3e; Cd &#x3e; Cu &#x3e; Co &#x3e; Zn. The fair prediction of Co, Cu, and Zn can be explained by the fact that a greater proportion of those elements penetrate and precipitate from the solution phase in the soil. As a result, a large amount of these PTEs are allocated naturally in the soil profile by an independent process, making them undetectable when scanning surface soil samples by Vis-NIRS (<xref ref-type="bibr" rid="B44">Sim&#xf3;n et al., 2001</xref>; <xref ref-type="bibr" rid="B15">Gholizadeh et al., 2021</xref>).</p>
<p>Based on the RPD classes of model performance (<xref ref-type="bibr" rid="B48">Viscarra Rossel et al., 2006</xref>), the prediction performance for Cr, Pb, and Cd, based on UVE-PLS, belonged to good to very good classes (RPD &#x3d; 1.86&#x2013;2.48). Cu, Co, and Zn models&#x2019; performance is considered fair (RPD &#x3d; 1.41&#x2013;1.78). Our results are in agreement with those reported by <xref ref-type="bibr" rid="B55">Xu et al. (2019)</xref>, who have reported the highest accuracy for Cr with a correlation coefficient (&#x3c1;c) of 0.80, RPD of 1.63, and RMSEP of 9.47, which is higher than those obtained in the current study (8.29&#xa0;mg&#xa0;kg<sup>&#x2212;1</sup>). Our results are better than those reported by <xref ref-type="bibr" rid="B39">O&#x27;Rourke et al. (2016)</xref>, using a prediction set of 80 soil samples analysed with a full range Vis-NIRS coupled with a cubist modelling method for the prediction of the total concentration of 40 soil elements. The authors reported poor results for Cr with R<sup>2</sup> &#x3d; 0.26, RMSEP &#x3d; 24.93&#xa0;mg kg<sup>&#x2212;1</sup>, and RPIQ &#x3d; 0.44), with a concentration range from 5.56 to 221.7&#xa0;mg kg<sup>&#x2212;1</sup>. In this context, <xref ref-type="bibr" rid="B47">Todorova et al. (2014)</xref>, who used 124 soil samples and full-range Vis-NIRS coupled with PLSR, reported excellent to poor prediction for Cu, Zn, Pb, Ni, and Cr with R<sup>2</sup>, RPD, and RMSEP of 0.89&#x2013;0.38, 3.16&#x2013;1.3, and 4.75&#x2013;21.35&#xa0;mg kg<sup>&#x2212;1</sup>, respectively. They found the highest accuracy for Cu and the worst for Cr. Also, poor results have been reported for estimating Cr based on PLSR and full spectral range (<xref ref-type="bibr" rid="B56">Xu et al., 2021</xref>). The authors reported R<sup>2</sup> &#x3d; 0.45, RPD &#x3d; 1.38, and RMSEP of 20.33&#xa0;mg kg<sup>&#x2212;1</sup>, and they suggested using appropriate dimensionality reduction methods for optimal results.</p>
<p>The first derivative provided higher-performance PTEs models than the second derivative when estimating PTEs in soils using spectral derivatives (<xref ref-type="bibr" rid="B34">Nawar et al., 2016</xref>; <xref ref-type="bibr" rid="B9">Chakraborty et al., 2017</xref>). The first derivative improves the spectral data while keeping the information&#x2019;s continuity and integrity, while the second derivative adds more noise to the spectral information (<xref ref-type="bibr" rid="B34">Nawar et al., 2016</xref>; <xref ref-type="bibr" rid="B26">Khosravi et al., 2018</xref>). In this study, however, the performance of the models-based derivative spectra was higher than those of the models-based first derivative when estimating the target key PTEs using the selected wavelengths. The advantage of using the second derivative can be attributed to the capabilities of the second derivative to improve the spectral resolution, reduce the background noise, and pick out spectral peaks (<xref ref-type="bibr" rid="B28">Kong et al., 2018</xref>). Finding the spectral peaks that overlap is the critical part of the second derivative ability to improve the resolution of second derivative spectra, which helps to find out where the samples are different and locate the best wavelengths close to the spectral peaks (<xref ref-type="bibr" rid="B41">Saranwong et al., 2004</xref>). In this context, high-order derivatives showed better capabilities than low-order derivatives in assessing PTEs (Cr, Cu, and Ag) (<xref ref-type="bibr" rid="B56">Xu et al., 2021</xref>). Therefore, the above reasons may explain why models based second derivative outperformed the models based on the first derivative spectra when using variable selection techniques.</p>
<p>In the current study, the usefulness and benefit of feature selection algorithms, UVE and SA, were tested for selecting optimal variables for PTEs prediction. Using the feature selection algorithms resulted in removing the redundant and unuseful variables, reducing the spectral data dimension, selecting fewer variables of the spectral data, and avoiding potential over-fitting (<xref ref-type="bibr" rid="B49">Vohland et al., 2011</xref>; <xref ref-type="bibr" rid="B15">Gholizadeh et al., 2021</xref>). The UVE set fewer spectral variables in this research and provided better results than full-range spectra and SA (<xref ref-type="table" rid="T2">Table 2</xref>). The superiority of UVE over SA has been reported (<xref ref-type="bibr" rid="B6">Balabin and Smirnov, 2011</xref>; <xref ref-type="bibr" rid="B38">Ong et al., 2022</xref>) and explained that UVE subjectively removes variables based on either high noise or low detector response in an automated way for the calibration of Vis-NIR data (<xref ref-type="bibr" rid="B8">Centner et al., 1996</xref>). Besides, the strength of UVE is due to the selection of the valuable wavelengths based on the stability of each wavelength evaluated by the calculated regression coefficients within the PLSR calibration (<xref ref-type="bibr" rid="B38">Ong et al., 2022</xref>). Therefore, the variables selection-based UVE method helps to develop robust and stable spectral predictive models (<xref ref-type="bibr" rid="B6">Balabin and Smirnov, 2011</xref>).</p>
<p>However, compared to most of the mentioned studies, the prediction samples used in this study were relatively small (n &#x3d; 20). The dataset significantly impacted the accuracy of calibration and prediction of soil properties, e.g., OC and PTEs (<xref ref-type="bibr" rid="B37">Nawar and Mouazen, 2017</xref>; <xref ref-type="bibr" rid="B15">Gholizadeh et al., 2021</xref>). The number of samples influences the model accuracy (<xref ref-type="bibr" rid="B11">Douglas et al., 2018</xref>; <xref ref-type="bibr" rid="B10">Cipullo et al., 2019</xref>), leading to various counterintuitive and unfamiliar side effects, leading to non-reasonable performance (<xref ref-type="bibr" rid="B11">Douglas et al., 2018</xref>; <xref ref-type="bibr" rid="B36">Nawar et al., 2019</xref>), with a general trend that the prediction capability increases with the sample&#x2019;s number. However the limitation of the prediction set in the current study, the results obtained here are better for some elements, e.g., Cr, Pb, and Cd, and comparable to others, e.g., Cu, Co, and Zn. One of the reasons for the better prediction results of PTEs could be a good distribution of samples with minimum and maximum values (<xref ref-type="table" rid="T2">Table 2</xref>). Therefore, a good pre-selection of the calibration and the prediction sets with the wide range of concentration will improve prediction performance. Consequently, further investigation of the impact of a different dataset is needed to determine the optimal sample size and concentration range for enhancing the prediction accuracy obtained in this work, particularly for Cu, Co, and Zn.</p>
</sec>
<sec sec-type="conclusion" id="s5">
<title>5 Conclusion</title>
<p>The current research investigates the potential of visible and near-infrared spectroscopy (Vis-NIRS) combined with PLSR and feature selection algorithms (uninformative variable elimination (UVE) and simulated annealing (SA)) to predict the PTEs (Cd, Cu, Co, Cu, Pb, and Zn) contents in agriculture soils under the arid conditions in a polluted area in Egypt. The results showed that (i) the Vis-NIRS has the potential for predicting the tested PTEs, (ii) the full-range spectral dataset (FR) resulted in very poor models performance for all the PTEs (R<sup>2</sup> &#x3c; 0.40), (iii) the predictions obtained from the selected variables of the spectra based on UVE algorithm combined with PLSR (UVE-PLS) improved all the PTEs models&#x2019; accuracies (0.46 &#x2264; R<sup>2</sup> &#x2264; 0.74) comparing with the models based the full spectral range, (iv) Cr models resulted in the highest performance for all methods (FR-PLS, SA-PLS, and UVE-PLS), and (v) the prediction results based on UVE-PLS for Cr, Pb, and Cd can be classified as very good (RPD values of 2.48, 2.03, and 1.86, respectively), and less accurate predictions (good to fair) obtained for Cu, Co, and Zn (RPD values of 1.78, 1.68, and 1.41, respectively). The results suggested that Vis-NIRS combined with the PLSR and feature selection algorithm (UVE) is promising for screening PTEs in agricultural soils. Future research should focus on testing these findings on larger datasets with a wider range of contents from different sites to be combined with other powerful machine learning methods such as cubist and random forest.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s6">
<title>Data availability statement</title>
<p>Data are available from the authors upon request.</p>
</sec>
<sec id="s7">
<title>Author contributions</title>
<p>Conceptualization, SN and EM; methodology, SN, EM, and AH; software, SN; validation, SN; formal analysis, SN, EM, and AH; investigation, SN, SE-E, WM, AH, and EM; data curation, SE-E, AH, EM, and WM; visualization, SN; writing the paper draft, SN; review and editing the manuscript, SN, EM, SE-E, WM, NR, and AH. All authors contributed to the article and approved the submitted version.</p>
</sec>
<ack>
<p>The authors would like to acknowledge the soil and water department, faculty of agriculture, Suez Canal University, Egypt. The authors also acknowledge the soil department, faculty of agriculture, Minia University, and the National Authority for Remote Sensing and Space Sciences for laboratory analyses and support. This paper has been supported by the RUDN University Strategic Academic Leadership Program.</p>
</ack>
<sec sec-type="COI-statement" id="s9">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s10">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abou Heleika</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ismail</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Ahmed</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Delineation of contamination zone using geophysical and hydrogeochemical methods around the El Moheet drain in the El Minia district, Upper Egypt</article-title>. <source>Arab. J. Geosci.</source> <volume>11</volume> (<issue>20</issue>), <fpage>1</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1007/s12517-018-3927-2</pub-id>
</citation>
</ref>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Al-Soghir</surname>
<given-names>M. M. A.</given-names>
</name>
<name>
<surname>Mohamed</surname>
<given-names>A. G.</given-names>
</name>
<name>
<surname>El-Desoky</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Awad</surname>
<given-names>A. A. M.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Comprehensive assessment of soil chemical properties for land reclamation purposes in the toshka area, Egypt</article-title>. <source>Sustain. Switz.</source> <volume>14</volume> (<issue>23</issue>), <fpage>15611</fpage>. <pub-id pub-id-type="doi">10.3390/su142315611</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Andersen</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Bro</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Variable selection in regression-a tutorial</article-title>. <source>J. Chemom.</source> <volume>24</volume> (<issue>11&#x2013;12</issue>), <fpage>728</fpage>&#x2013;<lpage>737</lpage>. <pub-id pub-id-type="doi">10.1002/cem.1360</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Andries</surname>
<given-names>J. P. M.</given-names>
</name>
<name>
<surname>Vander Heyden</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Buydens</surname>
<given-names>L. M. C.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Improved variable reduction in partial least squares modelling based on Predictive-Property-Ranked Variables and adaptation of partial least squares complexity</article-title>. <source>Anal. Chim. Acta</source> <volume>705</volume> (<issue>1&#x2013;2</issue>), <fpage>292</fpage>&#x2013;<lpage>305</lpage>. <pub-id pub-id-type="doi">10.1016/j.aca.2011.06.037</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Andries</surname>
<given-names>J. P. M.</given-names>
</name>
<name>
<surname>Vander Heyden</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Buydens</surname>
<given-names>L. M. C.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Improved variable reduction in partial least squares modelling by Global-Minimum Error Uninformative-Variable Elimination</article-title>. <source>Anal. Chim. Acta</source> <volume>982</volume>, <fpage>37</fpage>&#x2013;<lpage>47</lpage>. <pub-id pub-id-type="doi">10.1016/j.aca.2017.06.001</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ara&#xfa;jo</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Dematt&#xea;</surname>
<given-names>J. A. M.</given-names>
</name>
<name>
<surname>Vicente</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Soil contaminated with chromium by tannery sludge and identified by vis-NIR-mid spectroscopy techniques</article-title>. <source>Int. J. Remote Sens.</source> <volume>35</volume> (<issue>10</issue>), <fpage>3579</fpage>&#x2013;<lpage>3593</lpage>. <pub-id pub-id-type="doi">10.1080/01431161.2014.907940</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Balabin</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Smirnov</surname>
<given-names>S. V.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Variable selection in near-infrared spectroscopy: Benchmarking of feature selection methods on biodiesel data</article-title>. <source>Anal. Chim. Acta</source> <volume>692</volume> (<issue>1&#x2013;2</issue>), <fpage>63</fpage>&#x2013;<lpage>72</lpage>. <pub-id pub-id-type="doi">10.1016/j.aca.2011.03.006</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bruemmer</surname>
<given-names>G. W.</given-names>
</name>
<name>
<surname>Gerth</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Herms</surname>
<given-names>U.</given-names>
</name>
</person-group> (<year>1986</year>). <article-title>Heavy metal species, mobility and availability in soils</article-title>. <source>Z. F&#xfc;r Pflanzenern&#xe4;hrung Und Bodenkd.</source> <volume>149</volume> (<issue>4</issue>), <fpage>382</fpage>&#x2013;<lpage>398</lpage>. <pub-id pub-id-type="doi">10.1002/jpln.19861490404</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Centner</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Massart</surname>
<given-names>D. L.</given-names>
</name>
<name>
<surname>De Noord</surname>
<given-names>O. E.</given-names>
</name>
<name>
<surname>De Jong</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Vandeginste</surname>
<given-names>B. M.</given-names>
</name>
<name>
<surname>Sterna</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>Elimination of uninformative variables for multivariate calibration</article-title>. <source>Anal. Chem.</source> <volume>68</volume> (<issue>21</issue>), <fpage>3851</fpage>&#x2013;<lpage>3858</lpage>. <pub-id pub-id-type="doi">10.1021/ac960321m</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chakraborty</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Weindorf</surname>
<given-names>D. C.</given-names>
</name>
<name>
<surname>Deb</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Paul</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Choudhury</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Rapid assessment of regional soil arsenic pollution risk via diffuse reflectance spectroscopy</article-title>. <source>Geoderma</source> <volume>289</volume>, <fpage>72</fpage>&#x2013;<lpage>81</lpage>. <pub-id pub-id-type="doi">10.1016/J.GEODERMA.2016.11.024</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cipullo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Nawar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mouazen</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Campo-Moreno</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Coulon</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Predicting bioavailability change of complex chemical mixtures in contaminated soils using visible and near-infrared spectroscopy and random forest regression</article-title>. <source>Sci. Rep.</source> <volume>9</volume> (<issue>1</issue>), <fpage>4492</fpage>&#x2013;<lpage>4503</lpage>. <pub-id pub-id-type="doi">10.1038/s41598-019-41161-w</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Douglas</surname>
<given-names>R. K.</given-names>
</name>
<name>
<surname>Nawar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Alamar</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Mouazen</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Coulon</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Rapid prediction of total petroleum hydrocarbons concentration in contaminated soil using vis-NIR spectroscopy and regression techniques</article-title>. <source>Sci. Total Environ.</source> <volume>616&#x2013;617</volume>, <fpage>147</fpage>&#x2013;<lpage>155</lpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2017.10.323</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ertlen</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Schwartz</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Trautmann</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Webster</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Brunet</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Discriminating between organic matter in soil from grass and forest by near-infrared spectroscopy</article-title>. <source>Eur. J. Soil Sci.</source> <volume>61</volume> (<issue>2</issue>), <fpage>207</fpage>&#x2013;<lpage>216</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-2389.2009.01219.x</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Forina</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lanteri</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Oliveros</surname>
<given-names>M. C. C.</given-names>
</name>
<name>
<surname>Millan</surname>
<given-names>C. P.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Selection of useful predictors in multivariate calibration</article-title>. <source>Anal. Bioanal. Chem.</source> <volume>380</volume> (<issue>3</issue>), <fpage>397</fpage>&#x2013;<lpage>418</lpage>. <pub-id pub-id-type="doi">10.1007/s00216-004-2768-x</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gauchi</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Chagnon</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Comparison of selection methods of explanatory variables in PLS regression with application to manufacturing process data</article-title>. <source>Chemom. Intelligent Laboratory Syst.</source> <volume>58</volume> (<issue>2</issue>), <fpage>171</fpage>&#x2013;<lpage>193</lpage>. <pub-id pub-id-type="doi">10.1016/S0169-7439(01)00158-7</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gholizadeh</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Coblinski</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Saberioon</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ben-Dor</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Dr&#xe1;bek</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Dematt&#xea;</surname>
<given-names>J. A. M.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Vis&#x2013;nir and xrf data fusion and feature selection to estimate potentially toxic elements in soil</article-title>. <source>Sensors</source> <volume>21</volume> (<issue>7</issue>), <fpage>2386</fpage>. <pub-id pub-id-type="doi">10.3390/s21072386</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gholizadeh</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Saberioon</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ben-Dor</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Bor&#x16f;vka</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Monitoring of selected soil contaminants using proximal and remote sensing techniques: Background, state-of-the-art and future perspectives</article-title>. <source>Crit. Rev. Environ. Sci. Technol.</source> <volume>48</volume> (<issue>3</issue>), <fpage>243</fpage>&#x2013;<lpage>278</lpage>. <pub-id pub-id-type="doi">10.1080/10643389.2018.1447717</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gholizadeh</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Saberioon</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ben-Dor</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Viscarra Rossel</surname>
<given-names>R. A.</given-names>
</name>
<name>
<surname>Bor&#x16f;vka</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Modelling potentially toxic elements in forest soils with vis&#x2013;NIR spectra and learning algorithms</article-title>. <source>Environ. Pollut.</source> <volume>267</volume>, <fpage>115574</fpage>. <pub-id pub-id-type="doi">10.1016/j.envpol.2020.115574</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Barimah</surname>
<given-names>A. O.</given-names>
</name>
<name>
<surname>Shujat</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Ouyang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Simultaneous quantification of active constituents and antioxidant capability of green tea using NIR spectroscopy coupled with swarm intelligence algorithm</article-title>. <source>LWT</source> <volume>129</volume>, <fpage>109510</fpage>. <pub-id pub-id-type="doi">10.1016/j.lwt.2020.109510</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hammam</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Mohamed</surname>
<given-names>W. S.</given-names>
</name>
<name>
<surname>Sayed</surname>
<given-names>S. E. E.</given-names>
</name>
<name>
<surname>Kucher</surname>
<given-names>D. E.</given-names>
</name>
<name>
<surname>Mohamed</surname>
<given-names>E. S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Assessment of soil contamination using gis and multi-variate analysis: A case study in el-minia governorate, Egypt</article-title>. <source>Agronomy</source> <volume>12</volume> (<issue>5</issue>), <fpage>1197</fpage>. <pub-id pub-id-type="doi">10.3390/agronomy12051197</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Han</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Qing</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Bao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>Q.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Rapid determination of low heavy metal concentrations in grassland soils around mining using vis&#x2013;NIR spectroscopy: A case study of inner Mongolia, China</article-title>. <source>Sensors</source> <volume>21</volume> (<issue>9</issue>), <fpage>3220</fpage>. <pub-id pub-id-type="doi">10.3390/s21093220</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hong</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Estimating lead and zinc concentrations in peri-urban agricultural soils through reflectance spectroscopy: Effects of fractional-order derivative and random forest</article-title>. <source>Sci. Total Environ.</source> <volume>651</volume>, <fpage>1969</fpage>&#x2013;<lpage>1982</lpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2018.09.391</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Nie</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Xiong</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zeng</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Feature selection method based on partial least squares and analysis of traditional chinese medicine data</article-title>. <source>Comput. Math. Methods Med.</source> <volume>2019</volume>, <fpage>9580126</fpage>. <pub-id pub-id-type="doi">10.1155/2019/9580126</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kalivas</surname>
<given-names>J. H.</given-names>
</name>
<name>
<surname>Roberts</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Sutter</surname>
<given-names>J. M.</given-names>
</name>
</person-group> (<year>1989</year>). <article-title>Global optimization by simulated annealing with wavelength selection for ultraviolet-visible spectrophotometry</article-title>. <source>Anal. Chem.</source> <volume>61</volume> (<issue>18</issue>), <fpage>2024</fpage>&#x2013;<lpage>2030</lpage>. <pub-id pub-id-type="doi">10.1021/ac00193a006</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kemper</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Sommer</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Estimate of heavy metal contamination in soils after a mining accident using reflectance spectroscopy</article-title>. <source>Environ. Sci. Technol.</source> <volume>36</volume> (<issue>12</issue>), <fpage>2742</fpage>&#x2013;<lpage>2747</lpage>. <pub-id pub-id-type="doi">10.1021/es015747j</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kennard</surname>
<given-names>R. W.</given-names>
</name>
<name>
<surname>Stone</surname>
<given-names>L. A.</given-names>
</name>
</person-group> (<year>1969</year>). <article-title>Computer aided design of experiments</article-title>. <source>Technometrics</source> <volume>11</volume> (<issue>1</issue>), <fpage>137</fpage>&#x2013;<lpage>148</lpage>. <pub-id pub-id-type="doi">10.1080/00401706.1969.10490666</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>Y. M.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y. Z.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Y. G.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Health risks of heavy metals in contaminated soils and food crops irrigated with wastewater in Beijing, China</article-title>. <source>Environ. Pollut.</source> <volume>152</volume> (<issue>3</issue>), <fpage>686</fpage>&#x2013;<lpage>692</lpage>. <pub-id pub-id-type="doi">10.1016/j.envpol.2007.06.056</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khosravi</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Doulati Ardejani</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Yousefi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Aryafar</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Monitoring soil lead and zinc contents via combination of spectroscopy with extreme learning machine and other data mining methods</article-title>. <source>Geoderma</source> <volume>318</volume>, <fpage>29</fpage>&#x2013;<lpage>41</lpage>. <pub-id pub-id-type="doi">10.1016/j.geoderma.2017.12.025</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kirkpatrick</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Gelatt</surname>
<given-names>C. D.</given-names>
</name>
<name>
<surname>Vecchi</surname>
<given-names>M. P.</given-names>
</name>
</person-group> (<year>1983</year>). <article-title>Optimization by simulated annealing</article-title>. <source>Science</source> <volume>220</volume> (<issue>4598</issue>), <fpage>671</fpage>&#x2013;<lpage>680</lpage>. <pub-id pub-id-type="doi">10.1126/science.220.4598.671</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kong</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Detection of Sclerotinia stem rot on oilseed rape (Brassica napus L) leaves using hyperspectral imaging</article-title>. <source>Sensors Switz.</source> <volume>18</volume> (<issue>6</issue>), <fpage>1764</fpage>. <pub-id pub-id-type="doi">10.3390/s18061764</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kooistra</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wehrens</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Buydens</surname>
<given-names>L. M. C.</given-names>
</name>
<name>
<surname>Leuven</surname>
<given-names>R. S. E. W.</given-names>
</name>
<name>
<surname>Nienhuis</surname>
<given-names>P. H.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Possibilities of soil spectroscopy for the classification of contaminated areas in river floodplains</article-title>. <source>ITC J.</source> <volume>3</volume> (<issue>4</issue>), <fpage>337</fpage>&#x2013;<lpage>344</lpage>. <pub-id pub-id-type="doi">10.1016/S0303-2434(01)85041-8</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Ba</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Assessing heavy metal concentrations in earth-cumulic-orthic-anthrosols soils using Vis-NIR spectroscopy transform coupled with chemometrics</article-title>. <source>Spectrochimica Acta - Part A Mol. Biomol. Spectrosc.</source> <volume>226</volume>, <fpage>117639</fpage>. <pub-id pub-id-type="doi">10.1016/j.saa.2019.117639</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Zhen</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Rapid detection of carbon-nitrogen ratio for anaerobic fermentation feedstocks using near-infrared spectroscopy combined with BiPLS and GSA</article-title>. <source>Appl. Opt.</source> <volume>58</volume> (<issue>18</issue>), <fpage>5090</fpage>. <pub-id pub-id-type="doi">10.1364/ao.58.005090</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Study on the prediction of soil heavy metal elements content based on visible near-infrared spectroscopy</article-title>. <source>Spectrochimica Acta - Part A Mol. Biomol. Spectrosc.</source> <volume>199</volume>, <fpage>43</fpage>&#x2013;<lpage>49</lpage>. <pub-id pub-id-type="doi">10.1016/j.saa.2018.03.040</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mayhoub</surname>
<given-names>A. B.</given-names>
</name>
<name>
<surname>Azzam</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>A survey on the assessment of wind energy potential in Egypt</article-title>. <source>Renew. Energy</source> <volume>11</volume> (<issue>2</issue>), <fpage>235</fpage>&#x2013;<lpage>247</lpage>. <pub-id pub-id-type="doi">10.1016/S0960-1481(96)00113-9</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Mehmood</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Saeb&#x00F8;</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Liland</surname>
<given-names>K. H.</given-names>
</name>
</person-group> (<year>2020</year>). <source>Comparison of variable selection methods in partial least squares regression</source>. <pub-id pub-id-type="doi">10.1002/cem.3226</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nawar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Buddenbaum</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hill</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kozak</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Mouazen</surname>
<given-names>A. M. A. M. A. M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Estimating the soil clay content and organic matter by means of different calibration methods of vis-NIR diffuse reflectance spectroscopy</article-title>. <source>Soil Tillage Res.</source> <volume>155</volume>, <fpage>510</fpage>&#x2013;<lpage>522</lpage>. <pub-id pub-id-type="doi">10.1016/j.still.2015.07.021</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nawar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Cipullo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Douglas</surname>
<given-names>R. K. K.</given-names>
</name>
<name>
<surname>Coulon</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Mouazen</surname>
<given-names>A. M. M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The applicability of spectroscopy methods for estimating potentially toxic elements in soils: State-of-the-art and future trends</article-title>. <source>Appl. Spectrosc. Rev.</source> <volume>55</volume> (<issue>7</issue>), <fpage>525</fpage>&#x2013;<lpage>557</lpage>. <pub-id pub-id-type="doi">10.1080/05704928.2019.1608110</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nawar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Delbecque</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Declercq</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>De Smedt</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Finke</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Verdoodt</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Can spectral analyses improve measurement of key soil fertility parameters with X-ray fluorescence spectrometry?</article-title> <source>Geoderma</source> <volume>350</volume>, <fpage>29</fpage>&#x2013;<lpage>39</lpage>. <pub-id pub-id-type="doi">10.1016/j.geoderma.2019.05.002</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nawar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mouazen</surname>
<given-names>A. M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Comparison between random forests, artificial neural networks and gradient boosted machines methods of on-line Vis-NIR spectroscopy measurements of soil total nitrogen and total carbon</article-title>. <source>Sensors Switz.</source> <volume>17</volume> (<issue>10</issue>), <fpage>2428</fpage>&#x2013;<lpage>2449</lpage>. <pub-id pub-id-type="doi">10.3390/s17102428</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ong</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Tung</surname>
<given-names>I. C.</given-names>
</name>
<name>
<surname>Chiu</surname>
<given-names>C. F.</given-names>
</name>
<name>
<surname>Tsai</surname>
<given-names>I. L.</given-names>
</name>
<name>
<surname>Shih</surname>
<given-names>H. C.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Determination of aflatoxin B1 level in rice (Oryza sativa L) through near-infrared spectroscopy and an improved simulated annealing variable selection method</article-title>. <source>Food control.</source> <volume>136</volume>, <fpage>108886</fpage>. <pub-id pub-id-type="doi">10.1016/j.foodcont.2022.108886</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>O&#x2019;Rourke</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Minasny</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Holden</surname>
<given-names>N. M.</given-names>
</name>
<name>
<surname>McBratney</surname>
<given-names>A. B.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Synergistic use of vis-NIR, MIR, and XRF spectroscopy for the determination of soil geochemistry</article-title>. <source>Soil Sci. Soc. Am. J.</source> <volume>80</volume> (<issue>4</issue>), <fpage>888</fpage>&#x2013;<lpage>899</lpage>. <pub-id pub-id-type="doi">10.2136/sssaj2015.10.0361</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Page</surname>
<given-names>A. L.</given-names>
</name>
<name>
<surname>Miller</surname>
<given-names>R. H.</given-names>
</name>
<name>
<surname>Keeney</surname>
<given-names>D. R.</given-names>
</name>
</person-group> (<year>1982</year>). <source>Methods of soil analysis: Part 2, chemical and microbiological properties agronomy series No 9</source>. <publisher-loc>Madison, WI</publisher-loc>: <publisher-name>American Society of Agronomy</publisher-name>.</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Saranwong</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sornsrivichai</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kawano</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Prediction of ripe-stage eating quality of mango fruit from its harvest quality measured nondestructively by near infrared spectroscopy</article-title>. <source>Postharvest Biol. Technol.</source> <volume>31</volume> (<issue>2</issue>), <fpage>137</fpage>&#x2013;<lpage>145</lpage>. <pub-id pub-id-type="doi">10.1016/j.postharvbio.2003.08.007</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Savitzky</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Golay</surname>
<given-names>M. J. E.</given-names>
</name>
</person-group> (<year>1964</year>). <article-title>Smoothing and differentiation of data by simplified least squares procedures</article-title>. <source>Anal. Chem.</source> <volume>36</volume> (<issue>8</issue>), <fpage>1627</fpage>&#x2013;<lpage>1639</lpage>. <pub-id pub-id-type="doi">10.1021/ac60214a047</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shi</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Q.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Proximal and remote sensing techniques for mapping of soil contamination with heavy metals</article-title>. <source>Appl. Spectrosc. Rev.</source> <volume>53</volume> (<issue>10</issue>), <fpage>783</fpage>&#x2013;<lpage>805</lpage>. <pub-id pub-id-type="doi">10.1080/05704928.2018.1442346</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sim&#xf3;n</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mart&#xed;n</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ortiz</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Garc&#xed;a</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Fern&#xe1;ndez</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Fern&#xe1;ndez</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2001</year>). <article-title>Soil pollution by oxidation of tailings from toxic spill of a pyrite mine</article-title>. <source>Sci. Total Environ.</source> <volume>279</volume> (<issue>1&#x2013;3</issue>), <fpage>63</fpage>&#x2013;<lpage>74</lpage>. <pub-id pub-id-type="doi">10.1016/S0048-9697(01)00726-4</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="web">
<collab>Soil Survey Staff</collab> (<year>2022</year>). <source>Keys to soil taxonomy</source>. <edition>13th Edn</edition>. <publisher-name>USDA-Natural Resources Conservation Service</publisher-name>.</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Spiegelman</surname>
<given-names>C. H.</given-names>
</name>
<name>
<surname>McShane</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Goetz</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Motamedi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Yue</surname>
<given-names>Q. L.</given-names>
</name>
<name>
<surname>Cot&#xe9;</surname>
<given-names>G. L.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>Theoretical justification of wavelength selection in PLS calibration: Development of a new algorithm</article-title>. <source>Anal. Chem.</source> <volume>70</volume> (<issue>1</issue>), <fpage>35</fpage>&#x2013;<lpage>44</lpage>. <pub-id pub-id-type="doi">10.1021/ac9705733</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Swierenga</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>De Groot</surname>
<given-names>P. J.</given-names>
</name>
<name>
<surname>De Weijer</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Derksen</surname>
<given-names>M. W. J.</given-names>
</name>
<name>
<surname>Buydens</surname>
<given-names>L. M. C.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>Improvement of PLS model transferability by robust wavelength selection</article-title>. <source>Chemom. Intelligent Laboratory Syst.</source> <volume>41</volume> (<issue>2</issue>), <fpage>237</fpage>&#x2013;<lpage>248</lpage>. <pub-id pub-id-type="doi">10.1016/S0169-7439(98)00055-0</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Todorova</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mouazen</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Lange</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Atanassova</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Potential of near-infrared spectroscopy for measurement of heavy metals in soil as affected by calibration set size</article-title>. <source>Water, Air, Soil Pollut.</source> <volume>225</volume> (<issue>8</issue>), <fpage>2036</fpage>&#x2013;<lpage>2057</lpage>. <pub-id pub-id-type="doi">10.1007/s11270-014-2036-4</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Viscarra Rossel</surname>
<given-names>R. A.</given-names>
</name>
<name>
<surname>Walvoort</surname>
<given-names>D. J. J.</given-names>
</name>
<name>
<surname>McBratney</surname>
<given-names>A. B.</given-names>
</name>
<name>
<surname>Janik</surname>
<given-names>L. J.</given-names>
</name>
<name>
<surname>Skjemstad</surname>
<given-names>J. O.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Visible, near infrared, mid infrared or combined diffuse reflectance spectroscopy for simultaneous assessment of various soil properties</article-title>. <source>Geoderma</source> <volume>131</volume> (<issue>1&#x2013;2</issue>), <fpage>59</fpage>&#x2013;<lpage>75</lpage>. <pub-id pub-id-type="doi">10.1016/j.geoderma.2005.03.007</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vohland</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Besold</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hill</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Fr&#xfc;nd</surname>
<given-names>H. C.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Comparing different multivariate calibration methods for the determination of soil organic carbon pools with visible to near infrared spectroscopy</article-title>. <source>Geoderma</source> <volume>166</volume> (<issue>1</issue>), <fpage>198</fpage>&#x2013;<lpage>205</lpage>. <pub-id pub-id-type="doi">10.1016/j.geoderma.2011.08.001</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Walkley</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Black</surname>
<given-names>I. A.</given-names>
</name>
</person-group> (<year>1934</year>). <article-title>An examination of the degtjareff method for determining soil organic matter, and a proposed modification of the chromic acid titration method</article-title>. <source>Soil Sci.</source> <volume>37</volume> (<issue>1</issue>), <fpage>29</fpage>&#x2013;<lpage>38</lpage>. <pub-id pub-id-type="doi">10.1097/00010694-193401000-00003</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wold</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sj&#xf6;str&#xf6;m</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Eriksson</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>PLS-regression: A basic tool of chemometrics</article-title>. <source>Chemom. Intelligent Laboratory Syst.</source> <volume>58</volume> (<issue>2</issue>), <fpage>109</fpage>&#x2013;<lpage>130</lpage>. <pub-id pub-id-type="doi">10.1016/S0169-7439(01)00155-1</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ji</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Gong</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>Q.</given-names>
</name>
<etal/>
</person-group> (<year>2007</year>). <article-title>A mechanism study of reflectance spectroscopy for investigating heavy metals in soils</article-title>. <source>Soil Sci. Soc. Am. J.</source> <volume>71</volume> (<issue>3</issue>), <fpage>918</fpage>&#x2013;<lpage>926</lpage>. <pub-id pub-id-type="doi">10.2136/sssaj2006.0285</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Ji</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Possibilities of reflectance spectroscopy for the assessment of contaminant elements in suburban soils</article-title>. <source>Appl. Geochem.</source> <volume>20</volume> (<issue>6</issue>), <fpage>1051</fpage>&#x2013;<lpage>1059</lpage>. <pub-id pub-id-type="doi">10.1016/j.apgeochem.2005.01.009</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiaobo</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Jiewen</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Povey</surname>
<given-names>M. J. W.</given-names>
</name>
<name>
<surname>Holmes</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Hanpin</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Variables selection methods in near-infrared spectroscopy</article-title>. <source>Anal. Chim. Acta</source> <volume>667</volume>, <fpage>14</fpage>&#x2013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1016/j.aca.2010.03.048</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Viscarra Rossel</surname>
<given-names>R. A.</given-names>
</name>
<name>
<surname>Biswas</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>X-ray fluorescence and visible near infrared sensor fusion for predicting soil chromium content</article-title>. <source>Geoderma</source> <volume>352</volume>, <fpage>61</fpage>&#x2013;<lpage>69</lpage>. <pub-id pub-id-type="doi">10.1016/j.geoderma.2019.05.036</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Lv</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Estimation of heavy metals in agricultural soils using vis-nir spectroscopy with fractional-order derivative and generalized regression neural network</article-title>. <source>Remote Sens.</source> <volume>13</volume> (<issue>14</issue>), <fpage>2718</fpage>. <pub-id pub-id-type="doi">10.3390/rs13142718</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>X. Y.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>F. F.</given-names>
</name>
<name>
<surname>Wong</surname>
<given-names>M. T. F.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>X. L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Identification of soil heavy metal sources from anthropogenic activities and pollution assessment of Fuyang County, China</article-title>. <source>Environ. Monit. Assess.</source> <volume>154</volume> (<issue>1&#x2013;4</issue>), <fpage>439</fpage>&#x2013;<lpage>449</lpage>. <pub-id pub-id-type="doi">10.1007/s10661-008-0410-7</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>