<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Environ. Sci.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Environmental Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Environ. Sci.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">2296-665X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1656095</article-id>
<article-id pub-id-type="doi">10.3389/fenvs.2025.1656095</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Estimation of heavy metals in agricultural soil using near-infrared spectroscopy with the improved evolutionary method</article-title>
<alt-title alt-title-type="left-running-head">Hong et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fenvs.2025.1656095">10.3389/fenvs.2025.1656095</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Hong</surname>
<given-names>Shaoyong</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1471140"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing - original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing - review and editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Siyuan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing - original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal Analysis</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lin</surname>
<given-names>Miaoquan</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing - original draft</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Meng</surname>
<given-names>Fangxiu</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal Analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing - review and editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Hou</surname>
<given-names>Can</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing - review and editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Validation" vocab-term-identifier="https://credit.niso.org/contributor-roles/validation/">Validation</role>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Chen</surname>
<given-names>Huazhou</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1048634"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &#x26; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/">Writing - review and editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
</contrib>
</contrib-group>
<aff id="aff1">
<label>1</label>
<institution>School of Artificial Intelligence, Guangzhou Huashang College</institution>, <city>Guangzhou</city>, <country country="CN">China</country>
</aff>
<aff id="aff2">
<label>2</label>
<institution>Mathematics Teaching and Research Group, Rongxian Experimental Senior Middle School</institution>, <city>Yulin</city>, <country country="CN">China</country>
</aff>
<aff id="aff3">
<label>3</label>
<institution>School of Mathematics and Statistics, Guilin University of Technology</institution>, <city>Guilin</city>, <country country="CN">China</country>
</aff>
<author-notes>
<corresp id="c001">
<label>&#x2a;</label>Correspondence: Huazhou Chen, <email xlink:href="mailto:hzchengut@foxmail.com">hzchengut@foxmail.com</email>
</corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-10">
<day>10</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2025</year>
</pub-date>
<volume>13</volume>
<elocation-id>1656095</elocation-id>
<history>
<date date-type="received">
<day>29</day>
<month>06</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>27</day>
<month>11</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>08</day>
<month>12</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Hong, Zhang, Lin, Meng, Hou and Chen.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Hong, Zhang, Lin, Meng, Hou and Chen</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-10">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Monitoring and real-time detection of soil heavy metal pollution are crucial to ensuring the safety of agricultural food products. Conventional methods for determining heavy metal concentrations require substantial time and costs. This study investigates intelligent modeling approaches for online detection of heavy metal contamination in soils. Based on Internet of Things communication, large&#x2010;scale near-infrared (NIR) spectral data were collected from distributed sensors for federated analysis.</p>
</sec>
<sec>
<title>Methods</title>
<p>In chemometric studies, the improved binary firefly algorithm (IBFA) is proposed for evolutionary variable selection, and the modified method of maximum information coefficient (MMIC) is designed to estimate the nonlinear correlation of unevenly distributed samples. Experimental soil data are collected from the Karst geology on the north side of Guangxi ZAR, China. The NIR calibration model is established by fusion of the IBFA and the MMIC methods (denoted as IBFA &#x002B; MMIC). The fusion model is applied for quantitative prediction targeting of four heavy metals in the Karst soil samples.</p>
</sec>
<sec>
<title>Results</title>
<p>The IBFA &#x002B; MMIC model can observe correlation coefficients higher than 0.9 and the lowest prediction errors during model training. It is tested with the correlations very close to 0.9, while the testing errors are acceptably low. These results outperform the counterpart models established by other cross combinations of firefly algorithm (FA)/IBFA and maximum information coefficient (MIC)/MMIC.</p>
</sec>
<sec>
<title>Discussion</title>
<p>The proposed modeling methodology is effectively validated for quantitative NIR analysis of different heavy metals in Karst soil data. Meanwhile, it provides critical technical support for the federated analytical performance of distributed sensing data, thereby facilitating precision soil management practices.</p>
</sec>
</abstract>
<kwd-group>
<kwd>distributed sensing</kwd>
<kwd>evolutionary method</kwd>
<kwd>firefly algorithm</kwd>
<kwd>modified maximum information coefficient</kwd>
<kwd>near-infrared spectroscopy</kwd>
<kwd>soil heavy metal</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This work was financially supported by the National Natural Science Foundation of China (62365008) and Special Project in Key Areas of Ordinary Universities and Colleges in Guangdong Province (2023ZDZX4069).</funding-statement>
</funding-group>
<counts>
<fig-count count="6"/>
<table-count count="4"/>
<equation-count count="7"/>
<ref-count count="46"/>
<page-count count="13"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Environmental Informatics and Remote Sensing</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<label>1</label>
<title>Introduction</title>
<p>Heavy metal contamination of soil is a grave and growing environmental concern (<xref ref-type="bibr" rid="B43">Zhang X. et al., 2024</xref>). Heavy metals enter the soil through fertilizer applications, mining activities, and sewage discharge, gradually accumulating and leading to contamination (<xref ref-type="bibr" rid="B18">Latosinska et al., 2021</xref>). Due to its long-term environmental persistence without degradation, this kind of contamination has detrimental effects on the ecosystem, resulting in a cascading impact on soil quality. Then, it is passed along the food chain, ultimately delivering harmful risks to human health (<xref ref-type="bibr" rid="B30">Perkovic et al., 2022</xref>). The monitoring and real-time detection of soil heavy metal pollution is essential for protecting the safety of agricultural foods. The conventional method for determining soil heavy metal concentrations is chemical analysis. This involves collecting soil samples from the field and measuring the target heavy metal content under laboratory settings and conditions. However, this process is time-consuming, laborious, and expensive; the number of available soil samples is limited. It does not lend itself to performing high-quality online studies to identify heavy metal variation.</p>
<p>Over the past few decades, near-infrared (NIR) spectral technology, which can obtain spectral responses from the samples and yield detailed spectral information about agricultural objects, has been developing (<xref ref-type="bibr" rid="B13">De Souza et al., 2016</xref>; <xref ref-type="bibr" rid="B28">Nawar et al., 2023</xref>). Supported by the Fourier transform (FT) technique, the NIR signals are amplified to a magnitude range that is easily distinguished. The FT-NIR sensing signal boasts wide-ranging continuous spectral bands with high resolution, providing rapid and precise estimation of soil sample components (<xref ref-type="bibr" rid="B27">Mortada et al., 2021</xref>). Specifically, the FT-NIR spectra of soil (scanning range at 10,000&#x2013;4,000&#xa0;cm cm<sup>&#x2212;1</sup>) reflect multiple cumulative properties of soil heterogeneous matters, such as soil minerals, nutrient targets, and moisture (<xref ref-type="bibr" rid="B19">Leenen et al., 2019</xref>). With the increasing demand for spectral prospecting, the &#x201c;big data&#x201d; concept of FT-NIR sensing of large quantities of soil samples enables the identification of the inherent components and extra substances in soil (including heavy metals).</p>
<p>When spectral sensing technology was initially applied for field detection of soil compositions, many studies focused on spectrally active soil analytes like organic carbon, nutrient components, iron oxides, and clay minerals (<xref ref-type="bibr" rid="B29">Paltseva et al., 2022</xref>; <xref ref-type="bibr" rid="B2">Al Maliki et al., 2018</xref>). These analytes have a direct relation with the spectral response. The main task is to identify the NIR bands to interpret their spectral features, which is feasible (<xref ref-type="bibr" rid="B40">Zhang et al., 2019</xref>). In contrast to the spectrally active analytes, heavy metal concentrations are more difficult to estimate using the spectral data in the NIR region due to their low concentrations in soil (<xref ref-type="bibr" rid="B17">Han et al., 2021</xref>). Successful prediction of soil heavy metals is carried out by laboratory experiments under preset ideal conditions (<xref ref-type="bibr" rid="B46">Zukowska et al., 2021</xref>). Because of the complex mechanism for the retrieval of soil contaminants, laboratory-based spectroscopy is often used to explore the relationship between an individual heavy metal and the spectrum (<xref ref-type="bibr" rid="B3">Ali et al., 2023</xref>).</p>
<p>Compared to laboratory measurements, the Internet of Things (IoT) framework endorses immediate sensing of soil properties with portable devices, which is quicker and less expensive (<xref ref-type="bibr" rid="B12">Dattatreya et al., 2024</xref>). Considering the spectral variation caused by field conditions, several studies focus on the extraction of spectral features from the online measured data (<xref ref-type="bibr" rid="B37">Wang et al., 2022</xref>). In combination with machine learning algorithms, calibration models are improved in terms of prediction accuracy and model stability (<xref ref-type="bibr" rid="B38">Zayani et al., 2023</xref>). These successful studies have provided a robust foundation for the development of adaptive learning methods in estimating soil metals with NIR technology (<xref ref-type="bibr" rid="B22">Li et al., 2024</xref>). In combination with the IoT framework, the spectra with internal signal pre-correction by the instrument are used to detect various alien contaminating elements over a large area of distributed spot-line geographical locations (<xref ref-type="bibr" rid="B7">Chen et al., 2020</xref>). Under the &#x201c;big data&#x201d; situation, the chemometric methods must be enhanced in fusion with some adaptive learning strategies to fill the gap between laboratory analysis and the IoT-based federal analysis of distributed sensing data. Prompt detection based on analysis of data distributed over a wide range of locations is currently emerging. It has become a new state-of-the-art application of NIR technology to support rapid detection and instant analysis in fields of agricultural and environmental sciences.</p>
<p>The term &#x201c;distributed sensing technique&#x201d; refers to real-time monitoring and immediate response by deploying multiple sensors to deal with fertilization, irrigation, defect treatment, and other relevant issues (<xref ref-type="bibr" rid="B1">Acharya and Kogure, 2023</xref>). The sensors are usually small or portable with low power support and communicate wirelessly with each other or with a base station (<xref ref-type="bibr" rid="B6">Chamara et al., 2023</xref>). Distributed sensing is convenient and useful for simultaneous data collection, good protection of data privacy, reduction of the system complexity, operating with low costs, and provision of a comprehensive view of the environment being monitored (<xref ref-type="bibr" rid="B5">Bourechak et al., 2023</xref>). There have been a few initial applications of rapid NIR/FT-NIR detection to environmental targets in food and agriculture. These studies use traditional distributed sensing and a data aggregation algorithm to search for solutions to field problems (<xref ref-type="bibr" rid="B16">Gouda et al., 2024</xref>; <xref ref-type="bibr" rid="B8">Chen et al., 2025</xref>). However, data aggregation requires substantial computing and communication resources. This scheme has poor performance in responding to instant and precise responses from portable smart devices such as tablets and mobile phones under the IoT framework (<xref ref-type="bibr" rid="B45">Zhou et al., 2024</xref>). In a scenario of rapid spectral analysis over a large area of geographical spots, computing resources must encode and decode the transmitted data frequently, which increases the energy consumption of the distributed sensing system (<xref ref-type="bibr" rid="B4">Babbar et al., 2025</xref>).</p>
<p>Evolutionary learning is a type of intelligent algorithm that can ease the computing intensity of encoding and decoding aggregated data. The principle of evolution depends on iterative population processes, which perform with superior individuals selected for reproduction and inferior ones eliminated in swarm selection (<xref ref-type="bibr" rid="B42">Zhang R. et al., 2024</xref>). The application of NIR spectroscopy in an IoT scenario partially benefits from this advanced property of evolutionary learning. In recent years, several evolutionary learning methods have become widely used and well-validated for NIR analysis (<xref ref-type="bibr" rid="B41">Zhang et al., 2021</xref>; <xref ref-type="bibr" rid="B23">Liu et al., 2024</xref>). As a result, studies that employed NIR/FT-NIR spectroscopy adopted evolutionary learning methods for quantitative or qualitative predictions on different soil metal substances in various land-use types. For example, <xref ref-type="bibr" rid="B34">Surawijaya et al. (2023)</xref> employed particle swarm optimization (PSO) to explore an optimized design of a fabricated grating structure, aiming for maximum NIR absorption. This was done to improve the calibration models for predicting silicon (Si) concentration in soil samples. <xref ref-type="bibr" rid="B33">Song et al. (2022)</xref> developed a binary grey wolf optimization (GWO) method combined with a PLS model for the determination of arsenic (As) and Pb concentrations in soil. This approach reduced the dimensionality of input data and increased the NIR predictive performance. Among various evolutionary algorithms, the firefly algorithm (FA) conducts global search across the entire space by imitating the brightness attraction mechanism among fireflies. The FA outperforms other evolutionary methods in several aspects. First, compared with other evolutionary algorithms, the FA must only adjust a small number of representative parameters (such as brightness attractiveness, light absorption coefficient, and step factor); it has stronger robustness in global optimization than GA, PSO, or GWO (<xref ref-type="bibr" rid="B9">Chhabra et al., 2021</xref>). Second, FA can achieve more flexible optimization according to specific problems, which is conducive to balancing the adaptive search ability and secondary development of the algorithm (<xref ref-type="bibr" rid="B14">Devi et al., 2022</xref>). Third, the FA algorithm can find better solutions within fewer iterations, and its optimization convergence speed is faster than other evolutionary algorithms (<xref ref-type="bibr" rid="B35">Tao et al., 2024</xref>). Many published articles have used the classical FA as an important chemometric support for NIR quantitative or qualitative analysis. For instance, it is used for the estimation of different ripening stages of apples, for the detection of nutrient freshness of tomato plants, and for the quality determination of grape seed oil (<xref ref-type="bibr" rid="B31">Pourdarbani et al., 2022</xref>; <xref ref-type="bibr" rid="B20">Li, 2021</xref>). FA has not yet been used as a machine learning tool for NIR detection of soil nutrition or pollutant substances. In addition, the previous works referring to evolutionary learning methods were conducted using laboratory or local field spectra, not for distributed sensing analysis in an IoT scenario involving &#x201c;big data&#x201d; over a large area of diverse geographical locations.</p>
<p>This study explored an intelligent modeling method in conjunction with NIR spectral technology to support the distributed sensing of heavy metal contamination of soils over a range of geographically different areas. In order to specify the distributed spectral sensing data for the estimation of soil heavy metal, we used a set of portable <italic>in situ</italic> sensors, which allows for the detection conditions more representative of the real-world field conditions than laboratory settings. Based on the IoT framework, federal analysis of the big spectral data collected from different sensors enabled us to identify the informative features by examining the relations between the NIR data and the targeted heavy metal concentrations. For chemometric studies, we investigate the improvement of evolutionary learning methods, taking FA as an example, to validate the practicability of the selection of spectral features, thereby bolstering a novel study branch of NIR technology for model optimization by the population iterative evolution. Considering the integrated impact of the complexity of soil properties and the diversity of distributed sensing, the extraction of spectral features from the entire variable set can be challenging. Nonetheless, we developed an improved FA method through binary discretization and further combined it with the information correlation method for fusion modeling. The proposed methodology aims to identify the key NIR spectral information for a good prediction of heavy metal concentrations in soil. Implementing intelligent modeling strategies is expected to effectively monitor heavy metal contamination in the soil environment and provide valuable technical support to assist the efforts in soil management.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2-1">
<label>2.1</label>
<title>Distributed sensing and data preparation</title>
<sec id="s2-1-1">
<label>2.1.1</label>
<title>Site selection and equipment settings</title>
<p>The Guangxi Zhuang Autonomous Region (Guangxi ZAR) is a mountainous and water-rich provincial administrative region in south China (see <xref ref-type="fig" rid="F1">Figure 1a</xref>), which has a mild climate and fertile soil resources and produces a variety of crops, vegetables, and fruits. However, on the north side of Guangxi ZAR, the mountains are mostly Karst geology (<xref ref-type="bibr" rid="B21">Li et al., 2023</xref>). The topography of Karst is characterized by ruggedness of the surface, variety of landforms, richness of bio-ecology, and poor nutrition in soils (<xref ref-type="bibr" rid="B44">Zhang Z. et al., 2024</xref>). To protect the fertile soils in the Karst circumstance, a total of 14 regular farmland areas were selected on the north side of the Guangxi ZAR for the study of distributed sensing detection of heavy metal concentrations. The 14 areas were distributed at the geographical locations identified in <xref ref-type="fig" rid="F1">Figure 1b</xref>. To balance distributed sensing and precise analysis, we used 12 spectral sensors in each location, which were set at an average squared distance for direct contact with the topsoil surface. The 12 <inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:mo>&#xd7;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> 14 sensors are all well connected to a cloud platform, from which the sensing operation can be remotely controlled.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Fourteen geographical locations of the selected farmland areas (the red points in <bold>(b)</bold>) for distributed sensing analysis. <bold>(a)</bold> Location of Guangxi ZAR in China. <bold>(b)</bold> Geographical locations of the selected areas.</p>
</caption>
<graphic xlink:href="fenvs-13-1656095-g001.tif">
<alt-text content-type="machine-generated">Two-panel map showing: (a) Guangxi Zhuang Autonomous Region (ZAR) highlighted in green in southern China, with the rest of China outlined in white and labeled; (b) detailed map of Guangxi ZAR with red dots numbered one to fourteen indicating selected geographical study locations, latitude and longitude lines, and a distance scale in kilometers.</alt-text>
</graphic>
</fig>
<p>The spectral sensing operation was conducted in late summer when the effects of moisture, roughness, and noise interference were minimized. Before spectral sensing, we visited the fields several times and kept in contact with the landowners and managers to acquire basic knowledge about the environmental conditions of the field. No rain fell on the day when we performed our sensing work, nor was any rain recorded 2&#xa0;days before. Technically, we learned that the drier soil surfaces can be caused by the season&#x2019;s climate factors. The properties of the upper mask of topsoil are mostly affected by boundary reasons other than the soil components. Thus, we removed approximately 1 inch of the upper mask and then collected the soil spectra using sensing devices. The sensors received the FT-NIR spectral data on heavy metal concentrations, as well as the other component properties.</p>
</sec>
<sec id="s2-1-2">
<label>2.1.2</label>
<title>The spectral data and the chemical records</title>
<p>The <italic>in situ</italic> FT-NIR spectra were measured in the fields using a micro FC-025-2&#xa0;TE spectrometer (ARCoptix Inc., Neuchatel, Switzerland) across the band of 10,000&#x2013;4,000&#xa0;cm cm<sup>&#x2212;1</sup> with 4&#xa0;cm cm<sup>&#x2212;1</sup> resolution. A total of 1,512 discrete variables were recorded for each sensing location. Over the 168 distributed spots, we collected the spectrometer detection results as the spectral sensing responses of 168 topsoil samples. We collected five repeated spectral measurements for each sample and computed the average data from the available spectral data.</p>
<p>Additionally, during the <italic>in situ</italic> measurement of the spectral, soil samples were collected from 1 inch below the surface, to a depth of 4 inches from each position, and delivered to the laboratory for the determination of the heavy metals of Zn, chromium (Cr), copper (Cu), and Pb. In the laboratory, the samples were oven-dried at 45&#xa0;&#xb0;C, gently crushed, and sieved to a fine earth fraction no larger than 2&#xa0;mm in diameter. The contents of Zn, Cr, Cu, and Pb were measured using the inductively coupled plasma atomic emission spectroscopy (ICP-AES) method (<xref ref-type="bibr" rid="B11">Daftsis and Zachariadis, 2008</xref>). <xref ref-type="table" rid="T1">Table 1</xref> shows the descriptive statistics of the targeted heavy metal concentrations for the distributed sensing samples, consisting of the maximum, the minimum, the mean value, the median, standard deviation (SD), coefficient of variation (CV), excess kurtosis (eKT), and skewness. These values are the aggregated amounts of the metals in the distributed samples.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Descriptive statistics of the four targeted heavy metal concentrations (mg/kg) of the sensing data.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Content</th>
<th align="center">Max</th>
<th align="center">Min</th>
<th align="center">Mean</th>
<th align="center">Median</th>
<th align="center">SD</th>
<th align="center">CV</th>
<th align="center">eKT</th>
<th align="center">Skewness</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">Zn</td>
<td align="center">594.13</td>
<td align="center">32.33</td>
<td align="center">210.29</td>
<td align="center">124.43</td>
<td align="center">160.19</td>
<td align="center">0.59</td>
<td align="center">0.88</td>
<td align="center">1.25</td>
</tr>
<tr>
<td align="center">Cr</td>
<td align="center">148.93</td>
<td align="center">63.69</td>
<td align="center">112.05</td>
<td align="center">16.10</td>
<td align="center">112.61</td>
<td align="center">0.14</td>
<td align="center">0.41</td>
<td align="center">&#x2212;0.45</td>
</tr>
<tr>
<td align="center">Cu</td>
<td align="center">86.79</td>
<td align="center">29.41</td>
<td align="center">60.46</td>
<td align="center">13.30</td>
<td align="center">60.09</td>
<td align="center">0.22</td>
<td align="center">&#x2212;0.46</td>
<td align="center">0.09</td>
</tr>
<tr>
<td align="center">Pb</td>
<td align="center">104.38</td>
<td align="center">14.31</td>
<td align="center">58.29</td>
<td align="center">22.23</td>
<td align="center">51.81</td>
<td align="center">0.38</td>
<td align="center">&#x2212;0.57</td>
<td align="center">0.62</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s2-2">
<label>2.2</label>
<title>Methodologies for evolutionary optimization</title>
<p>The distribution of information variables is discretized, so that the search for feature variables is in vital demand. In this case, evolutionary learning methods have the advantage of iteratively refining their solutions and are well-suited to assist in an intelligent search of the variables. Furthermore, the fusion or combination of these selected features can probably enhance the NIR model performance by recurrent evolution of the information about the analytes from the diverse distributed sensing data.</p>
<sec id="s2-2-1">
<label>2.2.1</label>
<title>Improvement of the FA method</title>
<p>The FA is a classical evolutionary learning method. It was originally developed by simulating the biological characteristics of firefly luminescence. In the swarm gathering principle, the attraction between fireflies decreases as their distance increases. The fireflies spontaneously fly toward the brightest individual to search for a superior position (<xref ref-type="bibr" rid="B39">Zeng et al., 2024</xref>). A &#x201c;0&#x2013;1&#x201d; mapping rule can simplify the FA method as a binary processing scheme (<xref ref-type="bibr" rid="B15">Ervural and Hakli, 2023</xref>). The binary FA (BFA) method is used to choose some discrete spectral variables at random, obeying the 0&#x2013;1 encoding rule, to generate a set of discrete NIR feature variables that correspond to candidate responses to the several target metal concentrations.</p>
<p>In the FA story, suppose that there is a total of <inline-formula id="inf2">
<mml:math id="m2">
<mml:mrow>
<mml:mi>N</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> individuals in the firefly population. The population evolves no more than <inline-formula id="inf3">
<mml:math id="m3">
<mml:mrow>
<mml:mi>G</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> times. With statistical explanation, we denote the <inline-formula id="inf4">
<mml:math id="m4">
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>th individual at the <inline-formula id="inf5">
<mml:math id="m5">
<mml:mrow>
<mml:mi>g</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>-th iteration as <inline-formula id="inf6">
<mml:math id="m6">
<mml:mrow>
<mml:msubsup>
<mml:mi>z</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula>, which is discretized as a vector in <inline-formula id="inf7">
<mml:math id="m7">
<mml:mrow>
<mml:mi>p</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> length, that is, <inline-formula id="inf8">
<mml:math id="m8">
<mml:mrow>
<mml:msubsup>
<mml:mi>z</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>z</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>z</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:msub>
<mml:mi>z</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>p</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mi>g</mml:mi>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>. For improvement, BFA generates a 0&#x2013;1 valued regulation index <inline-formula id="inf9">
<mml:math id="m9">
<mml:mrow>
<mml:msubsup>
<mml:mi>u</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>p</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mi>g</mml:mi>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> with the same length as <inline-formula id="inf10">
<mml:math id="m10">
<mml:mrow>
<mml:msubsup>
<mml:mi>z</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula>. The BFA presents the crossover calculation as the dot product of <inline-formula id="inf11">
<mml:math id="m11">
<mml:mrow>
<mml:msubsup>
<mml:mi>z</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
</mml:msubsup>
<mml:mo>&#xb7;</mml:mo>
<mml:msubsup>
<mml:mi>u</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula>. By randomization, the individual is decomposed as in binary coding, to produce a new individual for mutation and selection.</p>
<p>For the <inline-formula id="inf12">
<mml:math id="m12">
<mml:mrow>
<mml:mi>g</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>th iteration, the candidate wavenumbers that are identified by BFA are used as feature variables to establish models for the spectral sensing data. The fitness function originally defined by the brightness of firefly individuals is currently re-defined numerically as root mean square error (RMSE), directly linking to the model prediction effect.</p>
<p>To smooth the iteration, a threshold value is set in the fitness function to formulate the evolutionary individual, namely,<disp-formula id="e1">
<mml:math id="m13">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mi>z</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:msubsup>
<mml:mi>z</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
</mml:msubsup>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi>k</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#xb7;</mml:mo>
<mml:mo>&#x394;</mml:mo>
<mml:msubsup>
<mml:mi>z</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
</mml:msubsup>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mi>l</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#xb7;</mml:mo>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>0.5</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mtext>for&#x2009;</mml:mtext>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#x2026;</mml:mo>
<mml:mi>N</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>where <inline-formula id="inf13">
<mml:math id="m14">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mi>z</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> is the renewed candidate evolutionary individual after the <inline-formula id="inf14">
<mml:math id="m15">
<mml:mrow>
<mml:mi>g</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>-th iteration; <inline-formula id="inf15">
<mml:math id="m16">
<mml:mrow>
<mml:mo>&#x394;</mml:mo>
<mml:msubsup>
<mml:mi>z</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> represents the stochastic change by iteration; <inline-formula id="inf16">
<mml:math id="m17">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the threshold, and <inline-formula id="inf17">
<mml:math id="m18">
<mml:mrow>
<mml:msub>
<mml:mi>k</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf18">
<mml:math id="m19">
<mml:mrow>
<mml:msub>
<mml:mi>l</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are the tunable regularization parameters defined in the same dimension to <inline-formula id="inf19">
<mml:math id="m20">
<mml:mrow>
<mml:msubsup>
<mml:mi>z</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
<p>Next, the renewed candidate individual <inline-formula id="inf20">
<mml:math id="m21">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mi>z</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> crosses over with <inline-formula id="inf21">
<mml:math id="m22">
<mml:mrow>
<mml:msubsup>
<mml:mi>u</mml:mi>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> and is further mapped by the fitness function to identify the evolutionary individual for the selection of informative variables. The evolution of the population is determined as follows:<disp-formula id="e2">
<mml:math id="m23">
<mml:mrow>
<mml:msubsup>
<mml:mi>z</mml:mi>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mfenced open="{" close="" separators="|">
<mml:mrow>
<mml:mtable columnalign="center">
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:msubsup>
<mml:mi>z</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
</mml:msubsup>
<mml:mo>,</mml:mo>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x7c;</mml:mo>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mi>g</mml:mi>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3c;</mml:mo>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x7c;</mml:mo>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mi>z</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mo>,</mml:mo>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x7c;</mml:mo>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mi>g</mml:mi>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2265;</mml:mo>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x7c;</mml:mo>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>where <inline-formula id="inf22">
<mml:math id="m24">
<mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mi>g</mml:mi>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:msubsup>
<mml:mi>z</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
</mml:msubsup>
<mml:mo>&#xb7;</mml:mo>
<mml:msubsup>
<mml:mi>u</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf23">
<mml:math id="m25">
<mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mi>z</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#xb7;</mml:mo>
<mml:msubsup>
<mml:mi>u</mml:mi>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> for <inline-formula id="inf24">
<mml:math id="m26">
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#x2026;</mml:mo>
<mml:mi>N</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
<p>The primary BFA method is improved by applying the specially designed fitness function <inline-formula id="inf25">
<mml:math id="m27">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mo>&#xb7;</mml:mo>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> to launch the adaptive optimization for variable selection from the renewed candidate sets of <inline-formula id="inf26">
<mml:math id="m28">
<mml:mrow>
<mml:mfenced open="{" close="}" separators="|">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mi>z</mml:mi>
</mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
</mml:msubsup>
<mml:mo>&#x7c;</mml:mo>
<mml:mi>g</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#x2026;</mml:mo>
<mml:mi>N</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</inline-formula>. The iterative evolution terminates when it reaches the preset maxima and obtains the combination of the selected data. As the variables evolve through iterative learning, we develop a simple and concise model that is optimized with the endorsement of the fusion of these selected variables, so that the model can be improved to have high prediction accuracy. For convenience, the improved BFA method is hereafter denoted as IBFA.</p>
<p>In IBFA, the 0&#x2013;1 binary coding indicates that the variable is selected only if it is encoded as 1. Thus, the mapping function is important for variable selection. To speed up the convergence of iterations, a special function is proposed for adaptive mapping, which endorses high probabilities of individuals being encoded as 1 in the early iteration stage, and then the probabilities decrease as the iteration continues. Theoretically, this kind of mapping function should be concave and monotonically decreasing. We define our mapping function as follows:<disp-formula id="e3">
<mml:math id="m29">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mo>&#x7c;</mml:mo>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mi>g</mml:mi>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>&#x3bc;</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#xb7;</mml:mo>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mi>g</mml:mi>
</mml:msup>
<mml:mo>&#xb7;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>g</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>G</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#xb7;</mml:mo>
<mml:mo>&#x2061;</mml:mo>
<mml:mi>log</mml:mi>
<mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>g</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>G</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(3)</label>
</disp-formula>where <inline-formula id="inf27">
<mml:math id="m30">
<mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mi>g</mml:mi>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> represents the undergoing participants of variables at the <inline-formula id="inf28">
<mml:math id="m31">
<mml:mrow>
<mml:mi>g</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>th iteration; <inline-formula id="inf29">
<mml:math id="m32">
<mml:mrow>
<mml:mi>G</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the preset total number of rounds of iteration; <inline-formula id="inf30">
<mml:math id="m33">
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is a parameter that denotes the probability of individual variables being encoded as 1. It controls the 0&#x2013;1 binary division ratio, where <inline-formula id="inf31">
<mml:math id="m34">
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>100</mml:mn>
<mml:mo>%</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> of the variables are encoded as 1, and <inline-formula id="inf32">
<mml:math id="m35">
<mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>100</mml:mn>
<mml:mo>%</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> as 0. For instance, let <inline-formula id="inf33">
<mml:math id="m36">
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0.7</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf34">
<mml:math id="m37">
<mml:mrow>
<mml:mi>G</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>100</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>, we could have the iterative curve for the adaptive function available for the fixed participation of <inline-formula id="inf35">
<mml:math id="m38">
<mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mi>g</mml:mi>
</mml:msup>
<mml:mo>&#x2261;</mml:mo>
<mml:mn>1.92</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> (see <xref ref-type="fig" rid="F2">Figure 2</xref>). The function serves for fast identification of feature variables at a faster iterative convergence.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Curve for the adaptive mapping function <inline-formula id="inf36">
<mml:math id="m39">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mrow>
<mml:mfenced open="" close="|" separators="|">
<mml:mrow>
<mml:mi>g</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mi>g</mml:mi>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
</caption>
<graphic xlink:href="fenvs-13-1656095-g002.tif">
<alt-text content-type="machine-generated">Line graph showing the adaptive function f(g) on the vertical axis and iteration g on the horizontal axis, with values decreasing smoothly from approximately 0.7 at iteration zero to roughly 0.3 at iteration one hundred.</alt-text>
</graphic>
</fig>
</sec>
<sec id="s2-2-2">
<label>2.2.2</label>
<title>Information correlation for distributed sensing data</title>
<p>Evolutionary learning methods are advantageous for selecting spectral features. However, evolution optimization methods cannot handle the correlation and collinearity of variables. Confronting the situation of distributed sensing, the spectral data from different locations are inherently related to soil metal contamination, so they are typically correlated with each other. It is necessary to conduct a preliminary correlation analysis on the IoT-based cloud platform for all collected samples.</p>
<p>According to the NIR spectral property, more information is included in the wavelengths with higher correlations to the targeted metal concentration. Correlation analysis is a statistical measure that can tolerate data uncertainties (<xref ref-type="bibr" rid="B26">Mana and Pizzocaro, 2021</xref>). To effectively analyze the distributed data, we attempt to set a threshold for the correlation coefficient. This allows us to expand the candidate spectral range in accordance with the known chemical knowledge of the heavy metals. Subsequently, we can select the wavelength variables with higher correlation coefficients that exceed this threshold across the entire sensing dataset. These variables are prospectively available for enhancing models in an IoT environment where data are distributed.</p>
<p>The maximum information coefficient (MIC) is a special index that tells reliable correlations in terms of nonlinear correlation and uneven sample distribution (<xref ref-type="bibr" rid="B25">Luo et al., 2024</xref>). In theory, the original MIC algorithm is only concerned with selecting highly correlated variables but does not consider the influence of collinearity among the distributed data. To address this issue, we include a projection subtraction method to reduce the collinear effects on correlation analysis, so that the MIC algorithm is modified. The modified MIC algorithm (denoted as MMIC) is designed specifically for spectral sensing, with the aim of capturing a wide range of functional, interesting associations to provide a scoring indicator similar to the coefficient of determination in a regression model.</p>
<p>In detailed designs, we first make a fast computation of the MIC values between the raw wavenumber variables and the orthogonal variables. Suppose the raw dataset is denoted as <inline-formula id="inf37">
<mml:math id="m40">
<mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> and the orthogonal variable dataset as <inline-formula id="inf38">
<mml:math id="m41">
<mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>o</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>. A scatter plot is generated based on the two related variable sets, and the plotted map is divided into <inline-formula id="inf39">
<mml:math id="m42">
<mml:mrow>
<mml:mi>n</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> small grids. The mutual information is calculated between every two grids over all of the possible one-to-one pair grid combinations, formulated as <xref ref-type="disp-formula" rid="e4">Equations 4</xref>, <xref ref-type="disp-formula" rid="e5">5</xref>: <disp-formula id="e4">
<mml:math id="m43">
<mml:mrow>
<mml:msub>
<mml:mi>H</mml:mi>
<mml:mi>max</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>o</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mi>g</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:munder>
<mml:mi>max</mml:mi>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#x2026;</mml:mo>
<mml:mi>n</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:munder>
<mml:mrow>
<mml:mfenced open="{" close="}" separators="|">
<mml:mrow>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>o</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
<label>(4)</label>
</disp-formula>
<disp-formula id="e5">
<mml:math id="m44">
<mml:mrow>
<mml:mtext>MIC</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>H</mml:mi>
<mml:mi>max</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>o</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mi>g</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mi>log</mml:mi>
<mml:mo>&#x2061;</mml:mo>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:munder>
<mml:mi>min</mml:mi>
<mml:mi>j</mml:mi>
</mml:munder>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>o</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
<label>(5)</label>
</disp-formula>where <inline-formula id="inf40">
<mml:math id="m45">
<mml:mrow>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mo>&#xb7;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mo>&#xb7;</mml:mo>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> represents a function that monitors the frequency of the counted data points appearing in the <inline-formula id="inf41">
<mml:math id="m46">
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>-th targeted grid for <inline-formula id="inf42">
<mml:math id="m47">
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#x2026;</mml:mo>
<mml:mi>n</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
<p>Specifically, a forward-loop encoding procedure is designed to complete the cycling selection of projections to generate the dataset of <inline-formula id="inf43">
<mml:math id="m48">
<mml:mrow>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>o</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>. For the <inline-formula id="inf44">
<mml:math id="m49">
<mml:mrow>
<mml:mi>g</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>th round (going through the total of <inline-formula id="inf45">
<mml:math id="m50">
<mml:mrow>
<mml:mi>G</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> iterations), the projection is defined as <xref ref-type="disp-formula" rid="e6">Equation 6</xref>:<disp-formula id="e6">
<mml:math id="m51">
<mml:mrow>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>o</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x2212;</mml:mo>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msup>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mn>0</mml:mn>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#xb7;</mml:mo>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#xb7;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mi mathvariant="normal">T</mml:mi>
</mml:msup>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
<label>(6)</label>
</disp-formula>where <inline-formula id="inf46">
<mml:math id="m52">
<mml:mrow>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mn>0</mml:mn>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> is the raw variable that has the largest MIC value, and <inline-formula id="inf47">
<mml:math id="m53">
<mml:mrow>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>j</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> represents the variable in the <italic>j</italic>th grid. To widen the possible selection range of candidate feature variables, we set a threshold <inline-formula id="inf48">
<mml:math id="m54">
<mml:mrow>
<mml:mi>&#x3b8;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> to expand the range for candidate features. By the modification of dual factors of projection subtraction and threshold control, the MMIC value is refined as <xref ref-type="disp-formula" rid="e7">Equation 7</xref>:<disp-formula id="e7">
<mml:math id="m55">
<mml:mrow>
<mml:mtext>MMIC</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:munder>
<mml:mi>max</mml:mi>
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>n</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:munder>
<mml:mrow>
<mml:mfenced open="{" close="}" separators="|">
<mml:mrow>
<mml:mtext>MIC</mml:mtext>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#xb7;</mml:mo>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>&#x3b8;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
<label>(7)</label>
</disp-formula>where <inline-formula id="inf49">
<mml:math id="m56">
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>n</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is the upper bound of the available gridded area, which is usually valued as <inline-formula id="inf50">
<mml:math id="m57">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>n</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mn>3</mml:mn>
<mml:mo>/</mml:mo>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula id="inf51">
<mml:math id="m58">
<mml:mrow>
<mml:mi>&#x3b8;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> represents the threshold that is functional to expand the spectral range for IBFA iterative search.</p>
<p>In this way, the MMIC algorithm step-by-step performs correlation judgment by a series of dynamic MMIC values that are calculated by the embodiment of projection subtraction during the iterative data refining for the distributed sensing acquisition. Technically, we fuse the MMIC algorithm with the IBFA evolutionary method to identify the informative wavenumbers/variables.</p>
</sec>
</sec>
</sec>
<sec sec-type="results|discussion" id="s3">
<label>3</label>
<title>Results and discussion</title>
<p>For model establishment, training, and optimization, the 168 soil samples detected at different spot locations are partitioned into two functional sets, one for modeling and the other for testing. We used a usual partitioning ratio of 3:1 to determine the number of samples for the modeling set and for the testing set. The WSPXY method (<xref ref-type="bibr" rid="B36">Tian et al., 2019</xref>) is employed to make the division, so that the selected modeling samples are representative. Accordingly, the determination coefficient (R) and the root mean square error (RMSE) for modeling are denoted as R<sub>M</sub> and RMSE<sub>M</sub> and as R<sub>T</sub> and RMSE<sub>T</sub> for testing.</p>
<sec id="s3-1">
<label>3.1</label>
<title>Data pre-processing and model evaluation mode</title>
<p>The raw spectral sensing data are accompanied by noisy interference. To reduce the influence of multiple kinds of noise, the data were subjected to various pre-processing methods using the MATLAB toolbox. The pre-processing algorithms included Savitzky&#x2013;Golay (SG), discrete wavelet transformation (DWT), multiplicative scatter correction (MSC), standard normal variate (SNV), and their pair combinations.</p>
<p>To ensure the pre-processed models are not affected by multivariate aggregation, we employed the classical PLS method to perform pre-modeling training, with the computing mode by 5-fold cross-validation over the 168 soil samples. The cross-validation accuracy was evaluated by the determination coefficient (R<sub>CV</sub>) and the root mean square error (RMSE<sub>CV</sub>). In the PLS process, the participant variables are the latent variables developed by a linear combination of the initial wavenumbers. The model runs and evaluates itself for the number of latent variables changing from 1 to 20. The optimal number was selected with the release of R<sub>CV</sub> and RMSE<sub>CV</sub>. To ensure model stability, the procedure was repeated 20 times, and the average results of R<sub>CV</sub> and RMSE<sub>CV</sub> are observed for each of the heavy metal targets. After discarding the less significant results, the best pre-processing observations of the data are shown in <xref ref-type="table" rid="T2">Table 2</xref> for comparative selection of the best and refined noise reduction method.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Comparison of eight different solo and combined pre-processing algorithms based on 5-fold cross-validation for the spectral sensing data using classical PLS regression.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="center">Method</th>
<th colspan="4" align="center">R<sub>CV</sub>
</th>
<th colspan="4" align="center">RMSE<sub>CV</sub>
</th>
</tr>
<tr>
<th align="center">Zn</th>
<th align="center">Cr</th>
<th align="center">Cu</th>
<th align="center">Pb</th>
<th align="center">Zn</th>
<th align="center">Cr</th>
<th align="center">Cu</th>
<th align="center">Pb</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">Raw</td>
<td align="center">0.688</td>
<td align="center">0.671</td>
<td align="center">0.691</td>
<td align="center">0.713</td>
<td align="center">41.77</td>
<td align="center">25.20</td>
<td align="center">12.97</td>
<td align="center">11.91</td>
</tr>
<tr>
<td align="center">SG</td>
<td align="center">0.806</td>
<td align="center">0.730</td>
<td align="center">0.754</td>
<td align="center">0.779</td>
<td align="center">36.77</td>
<td align="center">23.07</td>
<td align="center">11.36</td>
<td align="center">10.48</td>
</tr>
<tr>
<td align="center">DWT</td>
<td align="center">0.824</td>
<td align="center">0.728</td>
<td align="center">0.752</td>
<td align="center">0.777</td>
<td align="center">34.61</td>
<td align="center">22.18</td>
<td align="center">10.60</td>
<td align="center">10.43</td>
</tr>
<tr>
<td align="center">MSC</td>
<td align="center">0.777</td>
<td align="center">0.710</td>
<td align="center">0.744</td>
<td align="center">0.756</td>
<td align="center">38.24</td>
<td align="center">22.51</td>
<td align="center">11.58</td>
<td align="center">10.90</td>
</tr>
<tr>
<td align="center">SNV</td>
<td align="center">0.796</td>
<td align="center">0.721</td>
<td align="center">0.732</td>
<td align="center">0.769</td>
<td align="center">37.31</td>
<td align="center">22.08</td>
<td align="center">11.87</td>
<td align="center">10.64</td>
</tr>
<tr>
<td align="center">SG &#x2b; MSC</td>
<td align="center">0.779</td>
<td align="center">0.758</td>
<td align="center">0.759</td>
<td align="center">0.784</td>
<td align="center">36.60</td>
<td align="center">21.88</td>
<td align="center">10.74</td>
<td align="center">9.73</td>
</tr>
<tr>
<td align="center">SG &#x2b; SNV</td>
<td align="center">0.799</td>
<td align="center">0.735</td>
<td align="center">0.790</td>
<td align="center">0.812</td>
<td align="center">36.26</td>
<td align="center">20.59</td>
<td align="center">11.26</td>
<td align="center">9.49</td>
</tr>
<tr>
<td align="center">DWT &#x2b; MSC</td>
<td align="center">0.849</td>
<td align="center">0.768</td>
<td align="center">0.783</td>
<td align="center">0.817</td>
<td align="center">34.13</td>
<td align="center">20.48</td>
<td align="center">11.41</td>
<td align="center">10.34</td>
</tr>
<tr>
<td align="center">DWT &#x2b; SNV</td>
<td align="center">0.834</td>
<td align="center">0.765</td>
<td align="center">0.804</td>
<td align="center">0.820</td>
<td align="center">33.28</td>
<td align="center">20.88</td>
<td align="center">10.33</td>
<td align="center">9.87</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>
<xref ref-type="table" rid="T2">Table 2</xref> indicates that the best refined pre-processing methods are different for each heavy metal concentration. Aiming to identify the minimum RMSE<sub>CV</sub> with a corresponding appropriate high value of R<sub>CV</sub>, we learned that the pair-combination methods have better pre-processing results for the distributed sensing soil samples. The best pre-processing method is DWT &#x2b; SNV, which released higher R<sub>CV</sub> values and lower RMSE<sub>CV</sub> than the other pre-processing methods for Zn, Cu, and Pb. Although the DWT &#x2b; SNV method did not observe the best values for Cr (the minimum RMSE<sub>CV</sub> or the highest R<sub>CV</sub>), the observed values are very close to the best values.</p>
</sec>
<sec id="s3-2">
<label>3.2</label>
<title>Multivariate analysis by classical PLS</title>
<p>The PLS method performs variable decomposition to generate a series of latent variables obeying the principal component analysis (PCA) principle (<xref ref-type="bibr" rid="B10">Cook, 2022</xref>). The latent variables in the front of the queue have major data information when sorted in descending order according to the variance contribution rate. Then, we can select a few latent variables for tuning the regression model and observing the optimal RMSE values for prediction. The first three latent variables (LV1, LV2, and LV3) account for most of the total variance of the dataset. They explained more than 99% of the total variance in spectral behaviors of the four targeted heavy metal concentrations. The contributions of LV1, LV2, and LV3 are 74.05%, 16.82%, and 8.78%, respectively. In contrast, the remaining latent variables (LVs) contribute much less (&#x3c;1% in all). Thus, we illustrate the LV biplot graph based on the LV1, LV2, and LV3 values (shown in <xref ref-type="fig" rid="F3">Figure 3</xref>). In <xref ref-type="fig" rid="F3">Figure 3</xref>, the samples are divided into three groups (denoted as GRP1, GRP2, and GRP3). The first group is totally consistent with the testing set. The remaining two sets are evenly divided from the modeling set so that they have similar numbers as the first group. The figures show that the distributed samples could be aggregated for uniform modeling according to their spectral properties with the designated groups. Indeed, with more than 90% variance contribution, the LV1&#x2013;LV2 projection scatter plot showed three main clusters of the designated sample partitions with obvious differences in the loadings, which indicates that the FT-NIR spectral signals over the distributed spots are able to quantify metal concentrations. As they inherit most of the spectral information, LV1 and LV2 are selected as the most important feature variables that represent the soil metal properties. Some other latent variables are also included for model refinement.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Coordinates of samples defined in plane projections of the first three latent variables (LV1, LV2, and LV3) from PLS regression.</p>
</caption>
<graphic xlink:href="fenvs-13-1656095-g003.tif">
<alt-text content-type="machine-generated">Three scatter plots compare three groups, GRP1 (blue triangles), GRP2 (red circles), and GRP3 (green squares) using latent variables LV1, LV2, and LV3. Each plot displays the separation and clustering of groups along different latent variable axes, with percentage variance explained shown on each axis. A legend on the right identifies the groups by color and shape.</alt-text>
</graphic>
</fig>
<p>Aiming at the four targeted heavy metals of Zn, Cr, Cu, and Pb, we established and trained the calibration models based on the key latent variables, including LV1 and LV2. We identified the optimal calibration models that demonstrated commendable prediction capabilities both for modeling and for testing. Some extracted latent variables other than LV1 and LV2 are tested. <xref ref-type="table" rid="T3">Table 3</xref> shows the prediction results from the optimal model endorsed with their supporting latent variables. All the selected latent variables originate from the raw wavenumber variables based on the full range of 10,000&#xa0;cm<sup>&#x2212;1</sup> to 4,000&#xa0;cm<sup>&#x2212;1</sup>. With interactive comparison among the targeted elements, we can find that the LV-based optimized models effectively predict Zn and Cu concentrations. Their models exhibit high correlation coefficients exceeding 0.88 in the modeling process, with the RMSE<sub>M</sub> lower than 13% of their respective mean values. In contrast, the models for Cr and Pb are less accurate, but they still reach the acceptable performance levels. The testing results are generally inferior to the modeling outputs, providing practical confirmation of the data-driven machine learning mechanism. In addition, we noted that the selected latent variables for each of the targets fall within the first 10 principal components, which indicates that the PLS models established for the FT-NIR prediction of soil heavy metals can be optimized using informative principal variables.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Quantification results by the classical PLS model accompanied by LV selections on multivariate features.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="center">Content</th>
<th rowspan="2" align="center">Selected LVs</th>
<th colspan="3" align="center">Modeling</th>
<th colspan="3" align="center">Testing</th>
</tr>
<tr>
<th align="center">R<sub>M</sub>
</th>
<th align="center">RMSE<sub>M</sub>
</th>
<th align="left">Relative percentage</th>
<th align="center">R<sub>T</sub>
</th>
<th align="center">RMSE<sub>T</sub>
</th>
<th align="left">Relative percentage</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">Zn</td>
<td align="center">LV1, LV2, LV3, LV5, and LV8</td>
<td align="center">0.881</td>
<td align="center">24.68</td>
<td align="center">11.7%</td>
<td align="center">0.878</td>
<td align="center">29.92</td>
<td align="center">14.2%</td>
</tr>
<tr>
<td align="center">Cr</td>
<td align="center">LV1, LV2, LV4, and LV5</td>
<td align="center">0.869</td>
<td align="center">14.69</td>
<td align="center">13.1%</td>
<td align="center">0.859</td>
<td align="center">17.13</td>
<td align="center">15.3%</td>
</tr>
<tr>
<td align="center">Cu</td>
<td align="center">LV1, LV2, LV3, LV4, and LV6</td>
<td align="center">0.886</td>
<td align="center">7.54</td>
<td align="center">12.5%</td>
<td align="center">0.867</td>
<td align="center">8.36</td>
<td align="center">13.8%</td>
</tr>
<tr>
<td align="center">Pb</td>
<td align="center">LV1, LV2, LV5, LV7, LV8, and LV10</td>
<td align="center">0.879</td>
<td align="center">7.77</td>
<td align="center">13.3%</td>
<td align="center">0.862</td>
<td align="center">8.78</td>
<td align="center">15.1%</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-3">
<label>3.3</label>
<title>IBFA evolutionary learning model</title>
<p>With binary transform and by-threshold improvement strategies, the IBFA evolutionary method was validated for its efficacy in selecting informative variables. In practice, we simultaneously set the inherent evolutionary parameters for both IBFA and FA algorithms. Based on the population that has a total of 60 individuals, the generation of renewed candidate individuals was regulated by the fitness function (see <xref ref-type="disp-formula" rid="e1">Formula 1</xref>), where we set the regularization parameters <inline-formula id="inf52">
<mml:math id="m59">
<mml:mrow>
<mml:msub>
<mml:mi>k</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf53">
<mml:math id="m60">
<mml:mrow>
<mml:msub>
<mml:mi>l</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> as changing from 0 to 1, and the threshold was set to an adjustment of <inline-formula id="inf54">
<mml:math id="m61">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b8;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mn>0.97</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>. The iteration process for evolution was regulated with the upper limitation of <inline-formula id="inf55">
<mml:math id="m62">
<mml:mrow>
<mml:mi>G</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>100</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>. In the selection step (see <xref ref-type="disp-formula" rid="e2">Formula 2</xref>), the binary factor <inline-formula id="inf56">
<mml:math id="m63">
<mml:mrow>
<mml:msub>
<mml:mi>u</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> was randomly generated as 0&#x2013;1 arrays for each round of iteration but always maintaining the same dimension consistent with <inline-formula id="inf57">
<mml:math id="m64">
<mml:mrow>
<mml:msub>
<mml:mi>z</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>. With the control of the fitness defined by the function of <inline-formula id="inf58">
<mml:math id="m65">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi>g</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> (see <xref ref-type="disp-formula" rid="e3">Formula 3</xref>), the variables selected by IBFA were regarded as informative and further delivered to re-establish the PLS models.</p>
<p>
<xref ref-type="fig" rid="F4">Figure 4</xref> depicts the iterative optimization processes of IBFA and FA, showcasing the predictive RMSE<sub>M</sub> derived from PLS modeling based on the chosen informative variables. For convenient comparison, the PLS prediction with none of the evolutionary optimization is also shown in the figure. The comparative experiments have substantiated that the involvement of IBFA and FA enhances the efficiency of wavenumber selection. As a result, the swarm-evolved PLS models outperformed the counterpart conventional PLS model. The lowest RMSE<sub>M</sub> is obtained in the IBFA intervened model after &#x223c;70 evolutions by iteration. This revealed that the adaptive mapping function defined by <xref ref-type="disp-formula" rid="e3">Formula 3</xref> appreciably improved the firefly evolutionary effect in combination with the binary discretization strategy. The gradient convergence of the IBFA model appears slightly later than that of FA, which corroborates the fact that local optimization is postponed when using a specially designed fitness function instead of the random mapping. With the best iterative optimization by IBFA, the PLS models were improved to have the lowest RMSE<sub>M</sub> values of 18.768&#xa0;mg/kg, 10.043&#xa0;mg/kg, 5.322&#xa0;mg/kg, and 5.019&#xa0;mg/kg for Zn, Cr, Cu, and Pb, respectively.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Iterative results based on the IBFA&#x2010;involved and the FA&#x2010;involved models (Noted that the black dashed line is with on evolution method, the red solid line is applied with the FA method, and the blue solid line is applied with the IBFA method).</p>
</caption>
<graphic xlink:href="fenvs-13-1656095-g004.tif">
<alt-text content-type="machine-generated">Four line charts compare RMSE_M values over 100 iterations for Zn, Cr, Cu, and Pb. Each chart shows three lines: a dashed black line for &#x201C;None&#x201D;, a red line for &#x201C;FA&#x201D;, and a blue line for &#x201C;IBFA&#x201D;. In all subplots, IBFA consistently yields lower RMSE_M than FA and None as iterations increase.</alt-text>
</graphic>
</fig>
<p>The IBFA iteration runs with 0&#x2013;1 binary crossover and selection over the raw variables of the FT-NIR wavenumbers. We identified the feature variables out of the total 1,512 raw wavenumbers for the FT-NIR data modeling on the Zn, Cr, Cu, and Pb elements (see <xref ref-type="fig" rid="F5">Figure 5</xref>). <xref ref-type="fig" rid="F5">Figure 5</xref> shows that the concatenation of the four sets of feature variables for Zn, Cr, Cu, and Pb merged in a total of 493 located wavenumbers. The placements of the 493 wavenumbers are uniformly distributed in the full range of 10,000&#x2013;4,000&#xa0;cm<sup>&#x2212;1</sup>. These feature variables are suitable for optimizing the PLS model to stable prediction results. This validates that the IBFA variable evolution technique is feasible to enhance the PLS model that works with the selected pre-processing method of DWT &#x2b; SNV. Both the distribution of latent variables and the IBFA iterative function are fused to perform variable computation on the spectral detection of soil heavy metal contents. This is an indication that evolution techniques could be largely attributed to the finding and identification of heavy metal contamination at the rough topsoil surface, even though that soil is in &#x201c;Karst fertile&#x201d; status.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>The 493 concatenated wavenumbers (identified by the dashed red lines) selected by the IBFA-involved PLS model for the prediction of Zn, Cr, Cu, and Pb.</p>
</caption>
<graphic xlink:href="fenvs-13-1656095-g005.tif">
<alt-text content-type="machine-generated">Line graph showing FT-NIR absorbance versus wavenumber, featuring a smooth black curve labeled as raw spectra, with overlaid colored vertical lines indicating selected feature wavenumbers for Zn (red), Cu (magenta), Cr (blue), and Pb (green).</alt-text>
</graphic>
</fig>
<p>A recent study shows that a distributed sensing of soil surface reduces the FT-NIR reflectance, which may be a drawback of the contribution of the loss of reflectance of metal elements (<xref ref-type="bibr" rid="B24">Lovynska et al., 2024</xref>). Moreover, simultaneous data analysis on a cloud platform may lead to uneven and heterogeneous effects in multivariate computation, thereby affecting the <italic>in situ</italic> spectral sensing output and making the evolutionary module less effective (<xref ref-type="bibr" rid="B32">Russell-Pavier et al., 2023</xref>). We can easily observe that the IBFA iteration has enhanced the PLS prediction results to an optimized level, and they remain stable to the end of the 100 rounds of evolutionary iteration. However, intensive training of the IBFA can lead the model into a local optimization trap, which means that the refined models with 493 selected feature variables are conditionally good and occasionally stable. The models have potential for further enhancement by studying the mutual correlation of information between the endorsed variables. Thus, the proposed MMIC method is employed to improve model stability and to seek a higher R value or a lower RMSE.</p>
</sec>
<sec id="s3-4">
<label>3.4</label>
<title>MMIC improvement for distributed data</title>
<p>To improve model precision, we combine the MMIC method with the IBFA-optimized PLS model for global refinement of feature selection. As the original MIC method accounts for data collinearity, the MMIC method fuses the projection subtraction in variable space and scores the association relationship between variables. In practice, the MMIC algorithm is applied after the IBFA, with the aim of capturing the features from the full range of available IBFA-produced variable space. The MMIC scoring indicator is dynamically evaluated by iterative steps to ensure the selected variables make an interesting contribution to model improvement.</p>
<p>In a deep analysis of the distributed spectral sensing data in a specified area, the MMIC-combined IBFA model was targeted to balance the prediction of the four metal elements of Zn, Cr, Cu, and Pb in the global view; the results are shown in <xref ref-type="table" rid="T4">Table 4</xref>. To examine the practical advantages of the IBFA-combined-MMIC (IBFA &#x2b; MMIC) model, the original FA method and the MIC algorithm are alternatively applied for comparison. <xref ref-type="table" rid="T4">Table 4</xref> shows that the IBFA &#x2b; MMIC model produced fairly good prediction results, with the R<sub>M</sub> values uniformly higher than 0.9 during the model training process. The other models (FA &#x2b; MIC, FA &#x2b; MMIC, IBFA &#x2b; MIC) performed less well than the IBFA &#x2b; MMIC model. The statistical significance of the presented models was validated by using a t-test. Aiming at 95% confidence level, the t values of these models were calculated and are listed in <xref ref-type="table" rid="T4">Table 4</xref>. In practice, the critical values of the t-test for each optimal model situation are different as the degrees of freedom vary, but all critical values are less than 2. The calculated t values of all optimal models for the prediction of Zn, Cr, Cu, and Pb were obviously larger than the critical t-test values, which validated that the selected feature variables are significant for model optimization. Specifically, the IBFA &#x2b; MMIC model has the largest calculated t values (2.74 for Zn, 2.63 for Cr, 2.65 for Cu, and 2.84 for Pb) of the models, which indicates that the proposed fusion model of IBFA &#x2b; MMIC performs best for both the validation samples and the testing samples. With this optimal modeling result, we confirmed the improvement of model prediction accuracy for estimating Zn, Cr, Cu, and Pb in soil.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Prediction results of the adaptive machine learning models by a combination of MIC and FA methods and their improvements.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="center">Method</th>
<th rowspan="2" align="left">Content</th>
<th colspan="2" align="center">Modeling</th>
<th rowspan="2" align="center">Number of variables</th>
<th rowspan="2" align="center">t value<sup>(&#x23;)</sup>
</th>
<th colspan="2" align="center">Testing</th>
</tr>
<tr>
<th align="center">R<sub>M</sub>
</th>
<th align="center">RMSE<sub>M</sub>
</th>
<th align="center">R<sub>T</sub>
</th>
<th align="center">RMSE<sub>T</sub>
</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="4" align="center">FA &#x2b; MIC</td>
<td align="center">Zn</td>
<td align="center">0.915</td>
<td align="center">23.072</td>
<td align="center">230</td>
<td align="center">2.49</td>
<td align="center">0.874</td>
<td align="center">27.324</td>
</tr>
<tr>
<td align="center">Cr</td>
<td align="center">0.902</td>
<td align="center">13.124</td>
<td align="center">268</td>
<td align="center">2.58</td>
<td align="center">0.872</td>
<td align="center">15.650</td>
</tr>
<tr>
<td align="center">Cu</td>
<td align="center">0.890</td>
<td align="center">6.560</td>
<td align="center">286</td>
<td align="center">2.45</td>
<td align="center">0.863</td>
<td align="center">8.359</td>
</tr>
<tr>
<td align="center">Pb</td>
<td align="center">0.856</td>
<td align="center">6.786</td>
<td align="center">279</td>
<td align="center">2.52</td>
<td align="center">0.838</td>
<td align="center">7.729</td>
</tr>
<tr>
<td rowspan="4" align="center">FA &#x2b; MMIC</td>
<td align="center">Zn</td>
<td align="center">0.922</td>
<td align="center">18.396</td>
<td align="center">153</td>
<td align="center">2.52</td>
<td align="center">0.890</td>
<td align="center">24.631</td>
</tr>
<tr>
<td align="center">Cr</td>
<td align="center">0.916</td>
<td align="center">9.713</td>
<td align="center">148</td>
<td align="center">2.57</td>
<td align="center">0.884</td>
<td align="center">13.269</td>
</tr>
<tr>
<td align="center">Cu</td>
<td align="center">0.906</td>
<td align="center">5.145</td>
<td align="center">150</td>
<td align="center">2.48</td>
<td align="center">0.875</td>
<td align="center">7.033</td>
</tr>
<tr>
<td align="center">Pb</td>
<td align="center">0.864</td>
<td align="center">5.665</td>
<td align="center">158</td>
<td align="center">2.60</td>
<td align="center">0.853</td>
<td align="center">6.668</td>
</tr>
<tr>
<td rowspan="4" align="center">IBFA &#x2b; MIC</td>
<td align="center">Zn</td>
<td align="center">0.928</td>
<td align="center">16.802</td>
<td align="center">122</td>
<td align="center">2.48</td>
<td align="center">0.898</td>
<td align="center">20.691</td>
</tr>
<tr>
<td align="center">Cr</td>
<td align="center">0.921</td>
<td align="center">8.668</td>
<td align="center">128</td>
<td align="center">2.52</td>
<td align="center">0.887</td>
<td align="center">10.980</td>
</tr>
<tr>
<td align="center">Cu</td>
<td align="center">0.918</td>
<td align="center">4.611</td>
<td align="center">131</td>
<td align="center">2.53</td>
<td align="center">0.882</td>
<td align="center">6.417</td>
</tr>
<tr>
<td align="center">Pb</td>
<td align="center">0.898</td>
<td align="center">4.778</td>
<td align="center">143</td>
<td align="center">2.58</td>
<td align="center">0.868</td>
<td align="center">5.529</td>
</tr>
<tr>
<td rowspan="4" align="center">
<bold>IBFA &#x2b; MMIC</bold>
</td>
<td align="center">Zn</td>
<td align="center">0.938</td>
<td align="center">15.130</td>
<td align="center">79</td>
<td align="center">2.74</td>
<td align="center">0.899</td>
<td align="center">18.161</td>
</tr>
<tr>
<td align="center">Cr</td>
<td align="center">0.922</td>
<td align="center">6.993</td>
<td align="center">83</td>
<td align="center">2.63</td>
<td align="center">0.892</td>
<td align="center">9.545</td>
</tr>
<tr>
<td align="center">Cu</td>
<td align="center">0.927</td>
<td align="center">4.262</td>
<td align="center">85</td>
<td align="center">2.65</td>
<td align="center">0.895</td>
<td align="center">4.759</td>
</tr>
<tr>
<td align="center">Pb</td>
<td align="center">0.914</td>
<td align="center">4.633</td>
<td align="center">93</td>
<td align="center">2.84</td>
<td align="center">0.876</td>
<td align="center">4.824</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>
<sup>(&#x23;)</sup>The t value calculated during the t-test for significance analysis.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>In other aspects, it is found that the IBFA &#x2b; MMIC eventually selects less informative variables than the other counterpart methods for model optimization. The applied feature variables are identified in the full spectral detection region (See <xref ref-type="fig" rid="F6">Figure 6</xref>). Successively, when using the selected feature variables for model testing, the model revealed appreciable testing results in terms of correlations (R<sub>T</sub>) and errors (RMSE<sub>T</sub>). The optimized model results are better than those of the previous IBFA-PLS models without MMIC improvement (with higher R<sub>M</sub> and lower RMSE<sub>M</sub> values). These results indicate that the proposed IBFA &#x2b; MMIC method is advantageous for the analysis of distributed spectral sensing data. Considering the differences in circumstances, the distributed data vary in dependence; each module must effectively test different emerging data from different located spots and each of the metals investigated to select the most suited model parameters for evolutionary iterative estimation of metal concentrations.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Selected feature wavenumbers selected by IBFA &#x002B; MMIC (Noted that the solid circles are labeling the selected wavenumbers).</p>
</caption>
<graphic xlink:href="fenvs-13-1656095-g006.tif">
<alt-text content-type="machine-generated">Four-panel chart displays FT-NIR absorbance versus wavenumber for Zn, Cr, Cu, and Pb using colored points and lines, highlighting selected wavenumbers for each element in red, blue, magenta, and green respectively.</alt-text>
</graphic>
</fig>
</sec>
</sec>
<sec sec-type="conclusion" id="s4">
<label>4</label>
<title>Conclusion</title>
<p>This study proposed an intelligent modeling approach for the distributed sensing of soil heavy metal contamination across diverse geographical regions. Large-scale NIR spectral data from IoT-distributed sensors underwent federated analysis. For chemometric innovation, the IBFA and MMIC methods were integrated for iterative optimization of the calibration model, targeting the protection of fertile Karst soils in Guangxi ZAR, China. The IBFA &#x2b; MMIC fusion model outperformed other preset models in quantifying four heavy metals (Zn, Cr, Cu, and Pb). IBFA extracted informative variables from raw full-range spectral wavenumbers for each metal (see <xref ref-type="fig" rid="F6">Figure 6</xref>), and MMIC improved the fusion of distributed samples. During training, the IBFA &#x2b; MMIC model achieved R<sub>M</sub>&#x3e;0.9 and low RMSE<sub>M</sub>; in testing, it maintained R<sub>T</sub> close to 0.9 and exhibited lower RMSE<sub>T</sub> than the FA &#x2b; MIC, FA &#x2b; MMIC, and IBFA &#x2b; MIC models (see <xref ref-type="table" rid="T4">Table 4</xref>).</p>
<p>In conclusion, soil heavy metal contamination is a complex challenge that demands a comprehensive, multifaceted mitigation strategy. This study explored the correlations between NIR spectral data and target heavy metal concentrations, successfully identifying informative spectral features. In chemometric research, we investigated improvements to evolutionary learning methods, validating the practicality of spectral feature selection and establishing a novel research paradigm for optimizing NIR technology-driven models via iterative evolution. Specifically, the proposed IBFA &#x2b; MMIC fusion model is engineered to extract critical NIR spectral information, facilitating accurate quantitative prediction of diverse heavy metal contents in soil and providing valuable technical support for soil pollution monitoring. However, IBFA is somewhat sensitive to parameter tuning during optimization, with parameter initialization influencing iterative results. Moreover, while MMIC captures multi-variable correlations, it cannot identify synergistic interactions in variable combinations&#x2014;limitations that restrict the generalized application of the IBFA &#x2b; MMIC fusion algorithm. Future work will involve developing a more stable IBFA optimization approach via parameter uncertainty analysis and repeated sample modeling, as well as exploring novel projection methods to uncover variable interactions. This will further improve the fusion model&#x2019;s predictive performance and generalization, enabling NIR spectroscopic technology (aided by intelligent algorithm advancements) to effectively monitor soil heavy metal contamination and support soil management initiatives.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/supplementary material; further inquiries can be directed to the corresponding author.</p>
</sec>
<sec sec-type="author-contributions" id="s6">
<title>Author contributions</title>
<p>SH: Funding acquisition, Writing &#x2013; original draft, Data curation, Validation, Writing &#x2013; review and editing, Methodology. SZ: Writing &#x2013; original draft, Methodology, Software, Visualization, Formal Analysis. ML: Visualization, Investigation, Data curation, Writing &#x2013; original draft. FM: Formal analysis, Writing &#x2013; review and editing, Investigation. CH: Software, Writing &#x2013; review and editing, Validation. HC: Conceptualization, Resources, Project administration, Writing &#x2013; review and editing, Funding acquisition, Supervision.</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s9">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p>
</sec>
<sec sec-type="disclaimer" id="s10">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<fn-group>
<fn fn-type="custom" custom-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2091122/overview">Pu Xia</ext-link>, University of Saskatchewan, Canada</p>
</fn>
<fn fn-type="custom" custom-type="reviewed-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1954046/overview">Shaohua Lei</ext-link>, Nanjing Hydraulic Research Institute, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/3270273/overview">Huanxue Zhang</ext-link>, Shandong Normal University, China</p>
</fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Acharya</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Kogure</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Application of novel distributed fibre-optic sensing for slope deformation monitoring: a comprehensive review</article-title>. <source>Int. J. Environ. Sci. Technol.</source> <volume>20</volume>, <fpage>8217</fpage>&#x2013;<lpage>8240</lpage>. <pub-id pub-id-type="doi">10.1007/s13762-022-04697-5</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Al Maliki</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Owens</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Hussain</surname>
<given-names>H. M.</given-names>
</name>
<name>
<surname>Al-Dahaan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Al-Ansari</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Chemometric methods to predict of Pb in urban soil from Port Pirie, South Australia, using spectrally active of soil carbon</article-title>. <source>Commun. Soil Sci. Plant Anal.</source> <volume>49</volume>, <fpage>1370</fpage>&#x2013;<lpage>1383</lpage>. <pub-id pub-id-type="doi">10.1080/00103624.2018.1464178</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ali</surname>
<given-names>J. K.</given-names>
</name>
<name>
<surname>Ghaleb</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Arangadi</surname>
<given-names>A. F.</given-names>
</name>
<name>
<surname>Le</surname>
<given-names>T. P. P.</given-names>
</name>
<name>
<surname>Moraetis</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Pavlopoulos</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Comprehensive assessment of the capacity of sand and sandstone from aquifer vadose zone for the removal of heavy metals and dissolved organics</article-title>. <source>Environ. Technol. Innov.</source> <volume>29</volume>, <fpage>102993</fpage>. <pub-id pub-id-type="doi">10.1016/j.eti.2022.102993</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Babbar</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Rani</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Soni</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Keshta</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Prasad</surname>
<given-names>K. D. V.</given-names>
</name>
<name>
<surname>Shabaz</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>Integrating remote sensing and geospatial AI-enhanced ISAC models for advanced localization and environmental monitoring</article-title>. <source>Environ. Earth Sci.</source> <volume>84</volume>, <fpage>118</fpage>. <pub-id pub-id-type="doi">10.1007/s12665-025-12121-7</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bourechak</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Zedadra</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Kouahla</surname>
<given-names>M. N.</given-names>
</name>
<name>
<surname>Guerrieri</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Seridi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Fortino</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>At the confluence of artificial intelligence and edge computing in IoT-Based applications: a review and new perspectives</article-title>. <source>Sensors</source> <volume>23</volume>, <fpage>1639</fpage>. <pub-id pub-id-type="doi">10.3390/s23031639</pub-id>
<pub-id pub-id-type="pmid">36772680</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chamara</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Bai</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Ge</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>AICropCAM: deploying classification, segmentation, detection, and counting deep-learning models for crop monitoring on the edge</article-title>. <source>Comput. Electron. Agric.</source> <volume>215</volume>, <fpage>108420</fpage>. <pub-id pub-id-type="doi">10.1016/j.compag.2023.108420</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Parametric-scaling optimization of pretreatment methods for the determination of trace/quasi-trace elements based on near infrared spectroscopy</article-title>. <source>Spectrochim. Acta - Part A Mol. Biomol. Spectrosc.</source> <volume>229</volume>, <fpage>117959</fpage>. <pub-id pub-id-type="doi">10.1016/j.saa.2019.117959</pub-id>
<pub-id pub-id-type="pmid">31884401</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Meng</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2025</year>). <article-title>A fuzzy-refined neural network architecture for rapid assessment of seawater pollution by hyperspectral imaging</article-title>. <source>J. Clean. Prod.</source> <volume>512</volume>, <fpage>145704</fpage>. <pub-id pub-id-type="doi">10.1016/j.jclepro.2025.145704</pub-id>
</mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chhabra</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Singh</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Kahlon</surname>
<given-names>K. S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Performance-aware energy-efficient parallel job scheduling in HPC grid using nature-inspired hybrid meta-heuristics</article-title>. <source>J. Ambient. Intell. Humaniz. Comput.</source> <volume>12</volume>, <fpage>1801</fpage>&#x2013;<lpage>1835</lpage>. <pub-id pub-id-type="doi">10.1007/s12652-020-02255-w</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cook</surname>
<given-names>R. D.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A slice of multivariate dimension reduction</article-title>. <source>J. Multivar. Anal.</source> <volume>188</volume>, <fpage>104812</fpage>. <pub-id pub-id-type="doi">10.1016/j.jmva.2021.104812</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Daftsis</surname>
<given-names>E. J.</given-names>
</name>
<name>
<surname>Zachariadis</surname>
<given-names>G. A.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Analytical performance of a multi-element ICP-AES method for Cd, Co, Cr, Cu, Mn, Ni and Pb determination in blood fraction samples</article-title>. <source>Microchim. Acta</source> <volume>160</volume>, <fpage>405</fpage>&#x2013;<lpage>411</lpage>. <pub-id pub-id-type="doi">10.1007/s00604-007-0791-2</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dattatreya</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Khan</surname>
<given-names>A. N.</given-names>
</name>
<name>
<surname>Jena</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Chatterjee</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Conventional to modern methods of soil NPK sensing: a review</article-title>. <source>IEEE Sens. J.</source> <volume>24</volume>, <fpage>2367</fpage>&#x2013;<lpage>2380</lpage>. <pub-id pub-id-type="doi">10.1109/JSEN.2023.3334243</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>De Souza</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Filgueiras</surname>
<given-names>P. R.</given-names>
</name>
<name>
<surname>Coelho</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Fontana</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Winkler</surname>
<given-names>T. C. B.</given-names>
</name>
<name>
<surname>Valderrama</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Validation of the near infrared spectroscopy method for determining soil organic carbon by employing a proficiency assay for fertility laboratories</article-title>. <source>J. Near Infrared Spectrosc.</source> <volume>24</volume>, <fpage>293</fpage>&#x2013;<lpage>303</lpage>. <pub-id pub-id-type="doi">10.1255/jnirs.1219</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Devi</surname>
<given-names>K. G.</given-names>
</name>
<name>
<surname>Mishra</surname>
<given-names>R. S.</given-names>
</name>
<name>
<surname>Madan</surname>
<given-names>A. K.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A dynamic adaptive firefly algorithm for flexible job shop scheduling</article-title>. <source>Intell. Autom. Soft Comput.</source> <volume>31</volume>, <fpage>429</fpage>&#x2013;<lpage>448</lpage>. <pub-id pub-id-type="doi">10.32604/iasc.2022.019330</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ervural</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Hakli</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>A binary reptile search algorithm based on transfer functions with a new stochastic repair method for 0-1 knapsack problems</article-title>. <source>Comput. Ind. Eng.</source> <volume>178</volume>, <fpage>109080</fpage>. <pub-id pub-id-type="doi">10.1016/j.cie.2023.109080</pub-id>
</mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gouda</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Abu-hashim</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Nassrallah</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Khalil</surname>
<given-names>M. N.</given-names>
</name>
<name>
<surname>Hendawy</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Benhasher</surname>
<given-names>F. F.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Integration of remote sensing and artificial neural networks for prediction of soil organic carbon in arid zones</article-title>. <source>Front. Environ. Sci.</source> <volume>12</volume> (<issue>1&#x2013;15</issue>), <fpage>1448601</fpage>. <pub-id pub-id-type="doi">10.3389/fenvs.2024.1448601</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Han</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Qing</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Bao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>Q.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Rapid determination of low heavy metal concentrations in grassland soils around mining using Vis-NIR spectroscopy: a case Study of Inner Mongolia, China</article-title>. <source>Sensors</source> <volume>21</volume>, <fpage>3220</fpage>. <pub-id pub-id-type="doi">10.3390/s21093220</pub-id>
<pub-id pub-id-type="pmid">34066493</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Latosinska</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kowalik</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Gawdzik</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Risk assessment of soil contamination with heavy metals from municipal sewage sludge</article-title>. <source>Appl. Sci.</source> <volume>11</volume>, <fpage>548</fpage>. <pub-id pub-id-type="doi">10.3390/app11020548</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Leenen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Welp</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Gebbers</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Paetzold</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Rapid determination of lime requirement by mid-infrared spectroscopy: a promising approach for precision agriculture</article-title>. <source>J. Plant Nutr. Soil Sci.</source> <volume>182</volume>, <fpage>953</fpage>&#x2013;<lpage>963</lpage>. <pub-id pub-id-type="doi">10.1002/jpln.201800670</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Rapid quality discrimination of grape seed oil using an extreme machine learning approach with near-infrared (NIR) spectroscopy</article-title>. <source>Spectroscopy</source> <volume>36</volume>, <fpage>14</fpage>&#x2013;<lpage>20</lpage>.</mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Peng</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Hydrological characteristics and available water storage of typical karst soil in SW China under different soil-rock structures</article-title>. <source>Geoderma</source> <volume>438</volume>, <fpage>116633</fpage>. <pub-id pub-id-type="doi">10.1016/j.geoderma.2023.116633</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>A Novel adaptive Robust NIR modeling method based on sparse Bayesian Learning</article-title>. <source>IEEE Trans. Ind. Inf.</source> <volume>20</volume>, <fpage>8499</fpage>&#x2013;<lpage>8511</lpage>. <pub-id pub-id-type="doi">10.1109/TII.2024.3367007</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Ai</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Bian</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Extreme learning machine combined with whale optimization Algorithm for spectral quantitative analysis of complex samples</article-title>. <source>J. Chemom.</source> <volume>38</volume>, <fpage>3590</fpage>. <pub-id pub-id-type="doi">10.1002/cem.3590</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lovynska</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Bayat</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Bol</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Moradi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Rahmati</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Raj</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Monitoring heavy metals and metalloids in soils and vegetation by remote sensing: a review</article-title>. <source>Remote Sens.</source> <volume>16</volume>, <fpage>3221</fpage>. <pub-id pub-id-type="doi">10.3390/rs16173221</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Maximal information coefficient and geodetector coupled quantification model: a new data-driven approach to coalbed methane reservoir potential evaluation</article-title>. <source>J. Pet. Explor. Prod. Technol.</source> <volume>14</volume>, <fpage>2937</fpage>&#x2013;<lpage>2951</lpage>. <pub-id pub-id-type="doi">10.1007/s13202-024-01880-x</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mana</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Pizzocaro</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>The least informative distribution and correlation coefficient of measurement results</article-title>. <source>Metrologia</source> <volume>58</volume>, <fpage>015012</fpage>. <pub-id pub-id-type="doi">10.1088/1681-7575/abcbe9</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mortada</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Medhat</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sabry</surname>
<given-names>Y. M.</given-names>
</name>
<name>
<surname>Sadek</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Shebl</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hassan</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Ultra-Compact fourier transform near-infrared MEMS spectral sensor for smart industry and IoT</article-title>. <source>IEEE J. Sel. Top. Quantum Electron.</source> <volume>27</volume>, <fpage>2</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1109/JSTQE.2021.3091375</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nawar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mohamed</surname>
<given-names>E. S.</given-names>
</name>
<name>
<surname>Essam-Eldeen Sayed</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mohamed</surname>
<given-names>W. S.</given-names>
</name>
<name>
<surname>Rebouh</surname>
<given-names>N. Y.</given-names>
</name>
<name>
<surname>Hammam</surname>
<given-names>A. A.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Estimation of key potentially toxic elements in arid agricultural soils using Vis-NIR spectroscopy with variable selection and PLSR algorithms</article-title>. <source>Front. Environ. Sci.</source> <volume>11</volume> (<issue>1&#x2013;13</issue>), <fpage>1222871</fpage>. <pub-id pub-id-type="doi">10.3389/fenvs.2023.1222871</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Paltseva</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Deeb</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Di Iorio</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Circelli</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Colombo</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Prediction of bioaccessible lead in urban and suburban soils with Vis-NIR diffuse reflectance spectroscopy</article-title>. <source>Sci. Total Environ.</source> <volume>809</volume>, <fpage>151107</fpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2021.151107</pub-id>
<pub-id pub-id-type="pmid">34688767</pub-id>
</mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Perkovic</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Paul</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Vasic</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Helming</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Human health and soil health risks from heavy metals, micro(nano)plastics, and antibiotic resistant bacteria in agricultural soils</article-title>. <source>Agronomy-Basel</source> <volume>12</volume>, <fpage>2945</fpage>. <pub-id pub-id-type="doi">10.3390/agronomy12122945</pub-id>
</mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pourdarbani</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Sabzi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Rohban</surname>
<given-names>M. H.</given-names>
</name>
<name>
<surname>Garc&#xed;a-Mateos</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Molina-Mart&#xed;nez</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Paliwal</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Metaheuristic algorithms in visible and near infrared spectra to detect excess nitrogen content in tomato plants</article-title>. <source>J. Near Infrared Spectrosc.</source> <volume>30</volume>, <fpage>197</fpage>&#x2013;<lpage>207</lpage>. <pub-id pub-id-type="doi">10.1177/09670335221098527</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Russell-Pavier</surname>
<given-names>F. S.</given-names>
</name>
<name>
<surname>Kaluvan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Megson-Smith</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Connor</surname>
<given-names>D. T.</given-names>
</name>
<name>
<surname>Fearn</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Connolly</surname>
<given-names>E. L.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>A highly scalable and autonomous spectroscopic radiation mapping system with resilient IoT detector units for dosimetry, safety and security</article-title>. <source>J. Radiol. Prot.</source> <volume>43</volume>, <fpage>011503</fpage>. <pub-id pub-id-type="doi">10.1088/1361-6498/acab0b</pub-id>
<pub-id pub-id-type="pmid">36595231</pub-id>
</mixed-citation>
</ref>
<ref id="B33">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Song</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Lei</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Guang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Rapid determination of As and Pb concentrations in soil based binary Grey Wolf Optimization and partial least squares regression</article-title>. <source>Eurasian Soil Sci.</source> <volume>55</volume>, <fpage>1313</fpage>&#x2013;<lpage>1322</lpage>. <pub-id pub-id-type="doi">10.1134/S1064229322090071</pub-id>
</mixed-citation>
</ref>
<ref id="B34">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Surawijaya</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Chandra</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Sulthoni</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Idris</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Adiono</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Modeling and Simulation of Si Grating Photodetector Fabricated Using MACE Method for NIR Spectrum</article-title>. <source>Electron.</source> <volume>12</volume>, <fpage>663</fpage>. <pub-id pub-id-type="doi">10.3390/electronics12030663</pub-id>
</mixed-citation>
</ref>
<ref id="B35">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tao</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>H. L.</given-names>
</name>
<name>
<surname>Meng</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z. T.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>An integrated firefly algorithm for the optimization of constrained engineering design problems</article-title>. <source>Soft Comput.</source> <volume>28</volume>, <fpage>3207</fpage>&#x2013;<lpage>3250</lpage>. <pub-id pub-id-type="doi">10.1007/s00500-023-09305-3</pub-id>
</mixed-citation>
</ref>
<ref id="B36">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tian</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Sheng</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>WSPXY combined with BP-ANN method for hemoglobin determination based on near-infrared spectroscopy</article-title>. <source>Infrared Phys. Technol.</source> <volume>102</volume>, <fpage>103003</fpage>. <pub-id pub-id-type="doi">10.1016/j.infrared.2019.103003</pub-id>
</mixed-citation>
</ref>
<ref id="B37">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Effects of hyperspectral data with different spectral resolutions on the estimation of soil heavy metal content: from ground-based and airborne data to satellite-simulated data</article-title>. <source>Sci. Total Environ.</source> <volume>838</volume>, <fpage>156129</fpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2022.156129</pub-id>
<pub-id pub-id-type="pmid">35605855</pub-id>
</mixed-citation>
</ref>
<ref id="B38">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zayani</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Fouad</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Michot</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Kassouk</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Baghdadi</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Vaudour</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Using machine-learning algorithms to predict soil organic carbon content from combined remote sensing imagery and laboratory Vis-NIR spectral datasets</article-title>. <source>Remote Sens.</source> <volume>15</volume>, <fpage>4264</fpage>. <pub-id pub-id-type="doi">10.3390/rs15174264</pub-id>
</mixed-citation>
</ref>
<ref id="B39">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zeng</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Firefly forest: a swarm iteration-free swarm intelligence clustering algorithm</article-title>. <source>J. King Saud. Univ. Inf. Sci.</source> <volume>36</volume>, <fpage>102219</fpage>. <pub-id pub-id-type="doi">10.1016/j.jksuci.2024.102219</pub-id>
</mixed-citation>
</ref>
<ref id="B40">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>W. S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Spectral features extraction for estimation of soil total nitrogen content based on modified ant colony optimization algorithm</article-title>. <source>Geoderma</source> <volume>333</volume>, <fpage>23</fpage>&#x2013;<lpage>34</lpage>. <pub-id pub-id-type="doi">10.1016/j.geoderma.2018.07.004</pub-id>
</mixed-citation>
</ref>
<ref id="B41">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Near Infrared feature waveband selection for fishmeal quality assessment by frequency adaptive binary differential evolution</article-title>. <source>Chemom. Intell. Lab. Syst.</source> <volume>217</volume>, <fpage>104393</fpage>. <pub-id pub-id-type="doi">10.1016/j.chemolab.2021.104393</pub-id>
</mixed-citation>
</ref>
<ref id="B42">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Meng</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2024a</year>). <article-title>Hyperscale data analysis oriented optimization mechanisms for higher education management systems platforms with evolutionary intelligence</article-title>. <source>Appl. Soft Comput.</source> <volume>155</volume>, <fpage>111460</fpage>. <pub-id pub-id-type="doi">10.1016/j.asoc.2024.111460</pub-id>
</mixed-citation>
</ref>
<ref id="B43">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2024b</year>). <article-title>Study on the migration behaviour of heavy metals at the improved mine soil-plant rhizosphere interface</article-title>. <source>Environ. Technol.</source> <volume>45</volume>, <fpage>4691</fpage>&#x2013;<lpage>4703</lpage>. <pub-id pub-id-type="doi">10.1080/09593330.2023.2283061</pub-id>
<pub-id pub-id-type="pmid">37947180</pub-id>
</mixed-citation>
</ref>
<ref id="B44">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2024c</year>). <article-title>The occurrence and distributions characteristics of microplastics in soils of different land use patterns in Karst Plateau, Southwest China</article-title>. <source>Sci. Total Environ.</source> <volume>906</volume>, <fpage>167651</fpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2023.167651</pub-id>
<pub-id pub-id-type="pmid">37813260</pub-id>
</mixed-citation>
</ref>
<ref id="B45">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Lei</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Handling data heterogeneity for IoT devices in federated learning: a knowledge fusion approach</article-title>. <source>IEEE Internet Things J.</source> <volume>11</volume>, <fpage>8090</fpage>&#x2013;<lpage>8104</lpage>. <pub-id pub-id-type="doi">10.1109/JIOT.2023.3319986</pub-id>
</mixed-citation>
</ref>
<ref id="B46">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zukowska</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Bik-Malodzinska</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Myszura</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Pawlowski</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pawlowska</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Effect of sewage sludge and mineral wool on water retention and heavy metal content in medium agronomic category soil</article-title>. <source>Environ. Prot. Eng.</source> <volume>47</volume>, <fpage>101</fpage>&#x2013;<lpage>110</lpage>. <pub-id pub-id-type="doi">10.37190/epe210407</pub-id>
</mixed-citation>
</ref>
</ref-list>
</back>
</article>