<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2024.1396183</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Estimation of the rice aboveground biomass based on the first derivative spectrum and Boruta algorithm</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Nian</surname>
<given-names>Ying</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2701722"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Su</surname>
<given-names>Xiangxiang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2558409"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yue</surname>
<given-names>Hu</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhu</surname>
<given-names>Yongji</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Jun</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Weiqiang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Sheng</surname>
<given-names>Yali</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ma</surname>
<given-names>Qiang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes" equal-contrib="yes">
<name>
<surname>Liu</surname>
<given-names>Jikai</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1983547"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes" equal-contrib="yes">
<name>
<surname>Li</surname>
<given-names>Xinwei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2694403"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>College of Resource and Environment, Anhui Science and Technology University</institution>, <addr-line>Chuzhou</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Anhui Province Crop Intelligent Planting and Processing Technology Engineering Research Center, Anhui Science and Technology University</institution>, <addr-line>Chuzhou, Anhui</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Anhui Province Agricultural Waste Fertilizer Utilization and Cultivated Land Quality Improvement Engineering Research Center, Anhui Science and Technology University</institution>, <addr-line>Chuzhou</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Ting Sun, China Jiliang University, China</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Muhammad Ahmad Hassan, Anhui Academy of Agricultural Sciences, China</p>
<p>Pan Gao, Shihezi University, China</p>
<p>Haibing He, Anhui Agricultural University, China</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Jikai Liu, <email xlink:href="mailto:liujk@ahstu.edu.cn">liujk@ahstu.edu.cn</email>; Xinwei Li, <email xlink:href="mailto:lixw@ahstu.edu.cn">lixw@ahstu.edu.cn</email>
</p>
</fn>
<fn fn-type="equal" id="fn003">
<p>&#x2020;These authors contributed equally to this work</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>25</day>
<month>04</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>15</volume>
<elocation-id>1396183</elocation-id>
<history>
<date date-type="received">
<day>05</day>
<month>03</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>11</day>
<month>04</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Nian, Su, Yue, Zhu, Li, Wang, Sheng, Ma, Liu and Li</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Nian, Su, Yue, Zhu, Li, Wang, Sheng, Ma, Liu and Li</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Aboveground biomass (AGB) is regarded as a critical variable in monitoring crop growth and yield. The use of hyperspectral remote sensing has emerged as a viable method for the rapid and precise monitoring of AGB. Due to the extensive dimensionality and volume of hyperspectral data, it is crucial to effectively reduce data dimensionality and select sensitive spectral features to enhance the accuracy of rice AGB estimation models. At present, derivative transform and feature selection algorithms have become important means to solve this problem. However, few studies have systematically evaluated the impact of derivative spectrum combined with feature selection algorithm on rice AGB estimation. To this end, at the Xiaogang Village (Chuzhou City, China) Experimental Base in 2020, this study used an ASD FieldSpec handheld 2 ground spectrometer (Analytical Spectroscopy Devices, Boulder, Colorado, USA) to obtain canopy spectral data at the critical growth stage (tillering, jointing, booting, heading, and maturity stages) of rice, and evaluated the performance of the recursive feature elimination (RFE) and Boruta feature selection algorithm through partial least squares regression (PLSR), principal component regression (PCR), support vector machine (SVM) and ridge regression (RR). Moreover, we analyzed the importance of the optimal derivative spectrum. The findings indicate that (1) as the growth stage progresses, the correlation between rice canopy spectrum and AGB shows a trend from high to low, among which the first derivative spectrum (FD) has the strongest correlation with AGB. (2) The number of feature bands selected by the Boruta algorithm is 19~35, which has a good dimensionality reduction effect. (3) The combination of FD-Boruta-PCR (FB-PCR) demonstrated the best performance in estimating rice AGB, with an increase in R&#xb2; of approximately 10% ~ 20% and a decrease in RMSE of approximately 0.08% ~ 14%. (4) The best estimation stage is the booting stage, with R<sup>2</sup> values between 0.60 and 0.74 and RMSE values between 1288.23 and 1554.82 kg/hm<sup>2</sup>. This study confirms the accuracy of hyperspectral remote sensing in estimating vegetation biomass and further explores the theoretical foundation and future direction for monitoring rice growth dynamics.</p>
</abstract>
<kwd-group>
<kwd>rice</kwd>
<kwd>AGB</kwd>
<kwd>remote sensing</kwd>
<kwd>hyperspectral data</kwd>
<kwd>derivative transform</kwd>
<kwd>machine learning algorithm</kwd>
</kwd-group>
<counts>
<fig-count count="5"/>
<table-count count="2"/>
<equation-count count="3"/>
<ref-count count="83"/>
<page-count count="11"/>
<word-count count="6560"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Technical Advances in Plant Science</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Rice (<italic>Oryza sativa</italic>), a herbaceous plant belonging to the genus <italic>Oryza</italic>, has a long history of cultivation and a broad planting region (<xref ref-type="bibr" rid="B39">Krishnan et&#xa0;al., 2011</xref>). Aboveground biomass (AGB) serves as a critical indicator for describing crop growth (<xref ref-type="bibr" rid="B71">Wang et&#xa0;al., 2016</xref>). Applying scientific methods to estimate rice AGB to improve crop yields is crucial for human food security and increased economic benefits (<xref ref-type="bibr" rid="B63">Spiertz and Ewert, 2009</xref>; <xref ref-type="bibr" rid="B16">Devia et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B6">Cao et&#xa0;al., 2021b</xref>). The conventional method for acquiring AGB primarily involves field sampling, which is both time-consuming and laborious (<xref ref-type="bibr" rid="B26">Gnyp et&#xa0;al., 2014</xref>). In contrast, remote sensing technology provides a fast and nondestructive method, providing a scientific basis and technical support for accurate estimation of AGB (<xref ref-type="bibr" rid="B58">Schino et&#xa0;al., 2003</xref>). Among them, satellite remote sensing platforms is commonly used for AGB estimation in large areas, such as forests (<xref ref-type="bibr" rid="B47">Lucas et&#xa0;al., 2020</xref>), grasslands (<xref ref-type="bibr" rid="B17">Fang et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B75">Yang et&#xa0;al., 2018</xref>), However, it is easily affected by spatial conditions and it is difficult to obtain satisfactory results at small field scales (<xref ref-type="bibr" rid="B81">Yue et&#xa0;al., 2019</xref>). UAV remote sensing platforms can perform low-altitude operations and obtain high-resolution images of crops, but the spectral resolution is low, which is not conducive to in-depth exploration of the spectral response of crops (<xref ref-type="bibr" rid="B3">Bansod et&#xa0;al., 2017</xref>). In comparison, near-ground hyperspectral remote sensing is not only suitable for small-scale crop monitoring, but can also acquire fine spectral data with high resolution and a broad spectrum of wavelengths, encapsulating abundant crop phenotype information and thereby offering increased opportunities for estimating the physical and chemical parameters of vegetation (<xref ref-type="bibr" rid="B21">Galv&#xe3;o et&#xa0;al., 2005</xref>; <xref ref-type="bibr" rid="B2">Atzberger et&#xa0;al., 2015</xref>).</p>
<p>To enhance the AGB estimation performance via hyperspectral remote sensing, the original spectral data are typically preprocessed to reduce noise and increase the accuracy of the data (<xref ref-type="bibr" rid="B48">Mishra et&#xa0;al., 2020</xref>). The Savitzky&#x2013;Golay (SG) smoothing algorithm and derivative transform are the principal methods for preprocessing. The SG smoothing algorithm helps to mitigate interference signals within spectral data and minimize random errors, thereby improving data reliability (<xref ref-type="bibr" rid="B56">Savitzky and Golay, 1964</xref>; <xref ref-type="bibr" rid="B46">Liu et&#xa0;al., 2014</xref>). Derivative transform spectrum emphasizes the absorption and reflection characteristics of the subject matter and augments the differentiation in spectral information (<xref ref-type="bibr" rid="B24">Gerretzen et&#xa0;al., 2015</xref>). For instance, <xref ref-type="bibr" rid="B70">Wang et&#xa0;al. (2004)</xref> demonstrated that the derivative spectrum can lessen the impact of noise, exhibits a high correlation with rice AGB, and performs effectively in estimating rice AGB. However, spectral data still face challenges such as excessive information redundancy and high dimensionality after preprocessing. There is a need for a reliable method that can reduce the dimensionality of spectral data and eliminate high correlations between bands.</p>
<p>In previous research, Some researchers have used a single vegetation index to estimate rice AGB and achieved good results. However, the vegetation indices is usually a combination of several sensitive wavelengths, ignoring a large volume of spectral information. In the 2020s, some scholars adopted complex dimensionality reduction methods to improve the utilization efficiency of rice spectral data. For example, <xref ref-type="bibr" rid="B34">Jia et&#xa0;al. (2022)</xref> used the continuous projection algorithm (SPA) to reduce the hyperspectral dimension and identified 12 characteristic bands to estimate the soil plant analysis development (SPAD) content of rice. <xref ref-type="bibr" rid="B80">Yu et&#xa0;al. (2020)</xref> utilized principal component analysis (PCA) to extract five principal components for the inversion of rice leaf nitrogen deficiency. The above studies used different dimensionality reduction methods to reduce spectral data redundancy, which is of positive significance for applying hyperspectral remote sensing technology to estimate rice AGB accurately. However, they present limitations. The objective of SPA is to eliminate combinations of variables that exhibit low collinearity and include distinctive information; however, this approach might omit some initial characteristics in the spectral data (<xref ref-type="bibr" rid="B5">Cao et&#xa0;al., 2021a</xref>). PCA is capable of using several independent principal components to depict the original data, yet this technique is confined to linear projection and exhibits inadequate performance in managing nonlinear data relationships (<xref ref-type="bibr" rid="B49">Moore, 1981</xref>; <xref ref-type="bibr" rid="B1">Abdi and Williams, 2010</xref>). Consequently, the effectiveness of the monitoring model in practical scenarios may be affected by different dimensionality reduction methods (<xref ref-type="bibr" rid="B20">Fu et&#xa0;al., 2020</xref>). Given these considerations, selecting a suitable dimensionality reduction method is essential for accurately identifying sensitive bands and enhancing the accuracy of the estimation model.</p>
<p>As a data dimensionality reduction method, the core of Boruta algorithm is to find all feature bands related to the dependent variable. Compared with other commonly used feature screening algorithms, Compared with other commonly used feature screening algorithms (<xref ref-type="bibr" rid="B41">Kursa and Rudnicki, 2010</xref>; <xref ref-type="bibr" rid="B40">Kursa et&#xa0;al., 2010</xref>). The algorithm was originally used in biological and medical fields and has since been used in agricultural research as well. For instance, <xref ref-type="bibr" rid="B42">Li et&#xa0;al. (2022)</xref> demonstrated that filtering spectral indices from winter wheat canopy hyperspectral data using the Boruta algorithm enhances data validity and establishes an accurate yield estimation model. The Boruta algorithm has great potential in physical and chemical parameter estimation. To further evaluate the ability of the Boruta algorithm to estimate rice AGB, this study also selected the RFE feature selection algorithm for comparison. RFE, an adaptive feature selection algorithm, iteratively removes the least important feature variables and ranks feature importance until the optimal feature subset is identified. This approach minimizes the effects of random fluctuations and interference information (<xref ref-type="bibr" rid="B69">Tunca et&#xa0;al., 2023</xref>). <xref ref-type="bibr" rid="B78">Yoosefzadeh-Najafabadi et&#xa0;al. (2021)</xref> applied RFE to determine the optimal wavelengths from hyperspectral data for soybean yield prediction. This indicates that these feature selection methods are effective in improving estimation models&#x2019; accuracy. However, relatively few studies have utilized the Boruta algorithm and the RFE algorithm for feature selection of derivative spectra to construct rice AGB estimation models.</p>
<p>Therefore, this study used the Boruta and RFE algorithms to eliminate interference information, identify sensitive bands, and integrate partial least squares regression (PLSR), principal component regression (PCR), support vector machine (SVM) and ridge regression (RR) to develop an AGB estimation model. Additionally, this study compares the estimation effects of various combinations of dimensionality reduction algorithms and machine learning models to identify the most accurate estimation results. The research objectives were to (1) compare the correlations between derivative spectrum of different orders and rice AGB to determine the optimal order; (2) evaluate the effectiveness of the Boruta algorithm and RFE algorithm in selecting feature bands to determine the best dimensionality reduction method; (3) evaluate the estimation capability of machine learning algorithms combined with feature selection algorithms on rice AGB; and (4) identify the optimal combination of models and the most suitable estimation stage.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Experimental design</title>
<p>The study was conducted in Xiaogang village, Fengyang County, Chuzhou city, Anhui Province, China (longitude 117&#xb0;46&#x2032;7&#x2033;E, latitude 32&#xb0;48&#x2032;52&#x2033;N) (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1A</bold>
</xref>), which is characterized by a subtropical monsoon climate, an average annual temperature of 15.4&#xb0;C, and an average annual precipitation of 1179.2 mm. The soil predominantly consists of clay with medium fertility on flat terrain. The experimental area included 36 plots, measuring 2 m &#xd7; 8 m each. The rice varieties tested were Runzhuxiangzhan (V1), Runzhuyinzhan (V2), and Hongxiangnuo (V3), with each plot replicated three times. Four nitrogen gradient treatments were applied with nitrogen application rates of N0 (0 kg/hm&#xb2;), N1 (100 kg/hm&#xb2;), N2 (200 kg/hm&#xb2;), and N3 (300 kg/hm&#xb2;). Phosphorus (90 kg/hm&#xb2;) and potash (135 kg/hm&#xb2;) fertilizers were applied once as basal fertilizer (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1B</bold>
</xref>). The experiment spanned from June 2020 to October 2020. The plants experienced no drought or flooding during the seedling stage and favorable conditions of abundant sunshine and moderate temperatures during the mid-growth stage, which are conducive to rice growth and development. Field management practices followed local cultivation methods and pest control technologies.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Rice experimental area <bold>(A, B)</bold> and data collection <bold>(C)</bold>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1396183-g001.tif"/>
</fig>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Data acquisition</title>
<sec id="s2_2_1">
<label>2.2.1</label>
<title>Ground data acquisition</title>
<p>Rice samples were collected on July 25 (tillering stage), August 13 (jointing stage), August 23 (booting stage), August 31 (heading stage) and September 20 (maturity stage). The sampling time was consistent with the hyperspectral data acquisition time. Rice samples were collected from three holes in each plot, and the locations of the sampling points were marked after each sampling to avoid duplicate sampling.</p>
<p>Rice samples were subsequently sent to the laboratory, after which stem, leaf, and ear separation was performed (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1C</bold>
</xref>). The sample was placed in an oven, dried for 0.5 h after the temperature increased to 105&#xb0;C, and then adjusted to 75&#xb0;C for more than 24 h until the mass was constant. The dry mass of the sample was obtained by summing the dry mass of the stem, leaves and ears of the plant. Finally, the aboveground biomass of the rice plants in each plot was obtained through the dry mass of the sample and the row spacing during rice planting.</p>
</sec>
<sec id="s2_2_2">
<label>2.2.2</label>
<title>Hyperspectral data collection</title>
<p>Hyperspectral data on the rice canopy spectra were collected using a handheld ground spectrometer (ASD FieldSpec&#xae; HandHeld&#x2122;2) covering a wavelength range from 325 to 1075 nm with a resolution of 1 nm. Measurements were conducted between 10:00 a.m. and 2:00 p.m. for each test. Prior to each measurement session, the instrument was calibrated against a standard radiation white plate and recalibrated after every two blocks to ensure accuracy. The data were collected at three evenly distributed points along the diagonal of each plot, with the spectrometer positioned vertically 0.5 m above the rice canopy (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1C</bold>
</xref>). The spectral data from the same plot were processed collectively, and the average spectral reflectance of the plot was calculated.</p>
</sec>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Hyperspectral data processing</title>
<sec id="s2_3_1">
<label>2.3.1</label>
<title>SG smoothing and derivative transform</title>
<p>The Savitzky&#x2212;Golay (SG) smoothing algorithm, a digital signal processing technique proposed by Savitzky and Golay, is employed to enhance signal frequency and eliminate data noise (<xref ref-type="bibr" rid="B56">Savitzky and Golay, 1964</xref>). The smoothing effect of the algorithm, which varies with the window length, preserves the original shape and peak heights of the wave signal (<xref ref-type="bibr" rid="B57">Schafer, 2011</xref>). To minimize data fluctuations, capture the overall trend of the spectral curves, and accurately analyze the spectral characteristics of rice, this study applied SG smoothing to the canopy spectral curves from 325 to 1075 nm recorded during the growth stage (<xref ref-type="bibr" rid="B9">Chen et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B61">Shi et&#xa0;al., 2021</xref>). However, due to the influence of noise, only the 400 to 900 nm range was selected for analysis.</p>
<p>Derivative transform serves to diminish background signals, with the FD highlighting absorption peaks and shoulders in the original spectrum (OS) (<xref ref-type="bibr" rid="B15">Demetriades-Shah et&#xa0;al., 1990</xref>; <xref ref-type="bibr" rid="B4">Becker et&#xa0;al., 2005</xref>). By differentiating peaks and valleys, more precise spectral reflectance data can be obtained (<xref ref-type="bibr" rid="B33">Ji et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B83">Zhao et&#xa0;al., 2022</xref>). The second derivative spectrum (SD) facilitates the accurate identification of absorption peak and shoulder positions within the OS, enhancing spectral reflectance differentiation and eliminating baseline offsets in spectral reflectance data (<xref ref-type="bibr" rid="B76">Yang et&#xa0;al., 2011</xref>). This study utilized the derivative function within the Origin software&#x2019;s data processing menu (Origin 2018) for these transformations.</p>
</sec>
<sec id="s2_3_2">
<label>2.3.2</label>
<title>Feature selection</title>
<p>Feature selection algorithms play a pivotal role in optimizing datasets prior to model construction. In this investigation, both the Boruta algorithm and the RFE algorithm were employed for feature selection.</p>
<p>The Boruta algorithm (<xref ref-type="bibr" rid="B53">Prasad et&#xa0;al., 2019</xref>) is an innovative feature selection method derived from the random forest approach. It identifies all characteristic bands in spectral data that are related to dependent variables, thereby elucidating the relationship between spectral characteristics and rice AGB. The foundational concept involves shuffling the original parameters to create shadow parameters, which are then combined with the original parameters into a feature matrix for training. Based on the importance scores from the random forest, the shadow parameters are ranked by importance, with the highest value designated the Z score. Original parameters more significant than the Z score are labeled &#x201c;most important&#x201d;, while those below are deemed &#x201c;unimportant&#x201d; and thus eliminated. Ultimately, the most important original parameters are selected as the optimal combination for constructing the inversion model.</p>
<p>Recursive feature elimination (RFE) (<xref ref-type="bibr" rid="B27">Guyon et&#xa0;al., 2002</xref>) is a wrapper-based selection method that starts with the construction of an initial model, ranking all feature bands by their importance, and iteratively removing the least significant features. By retraining the model with the remaining features and repeating this process, it gradually identifies the most critical subset of features. This algorithm excels by iteratively evaluating the contribution of each feature band to the model, thereby identifying the optimal feature subset to reveal the underlying structure and patterns within the data.</p>
</sec>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Model construction method</title>
<p>To thoroughly investigate the relationships between the independent and dependent variables, four machine learning models were selected for comparison: PLSR, PCR, SVM, and RR.</p>
<p>PLSR (<xref ref-type="bibr" rid="B23">Geladi and Kowalski, 1986</xref>) is a multivariate linear statistical method that focuses on finding a hyperplane that minimizes the variance between the response and independent variables. It projects predictor and observed variables into a new space to derive a linear regression model, known as a bilinear factor model, due to the presence of both data X and Y in this new space.</p>
<p>PCR (<xref ref-type="bibr" rid="B37">Kawano et&#xa0;al., 2018</xref>) employs PCA for predictive data mining, transforming original variables into principal components that are linear combinations of the original variables and mutually independent. Regression analysis is then performed on these principal components to derive the regression equation, which is subsequently applied to the original variables.</p>
<p>SVM (<xref ref-type="bibr" rid="B66">Suykens and Vandewalle, 1999</xref>) operates as a supervised learning model utilized for analyzing data in classification and regression analysis. The core concept involves identifying the optimal classification hyperplane for two types of samples in the original space when they are linearly separable. In instances where linear separability is not achievable, the samples are projected into a high-dimensional feature space where an optimal hyperplane is determined. This hyperplane classifies the samples, aiming to minimize the distance within similar classes and maximize the distance between distinct classes.</p>
<p>RR (<xref ref-type="bibr" rid="B32">Ivanda et&#xa0;al., 2021</xref>) serves as a technique for estimating the coefficients of a multiple regression model in scenarios where the independent variables exhibit high correlation. This is achieved by incorporating an L2 regularization term into the OLS loss function. The L2 regularization term is calculated as the product of the sum of the squares of the coefficients and a regularization parameter &#x3bb; (lambda).</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Accuracy evaluation</title>
<p>In this study, 70% of the sample data (n=25) were selected as the modeling set for each growth stage, and 30% of the sample data (n=11) were used as the validation set to construct the rice AGB estimation model. The coefficient of determination (R&#xb2;), root mean square error (RMSE), and mean absolute error (MAE) were used to evaluate the model accuracy. The closer R&#xb2; is to 1, the lower the RMSE and MAE are, and the higher the accuracy of the estimation model is. R&#xb2;, RMSE and MAE are calculated using <xref ref-type="disp-formula" rid="eq1">Equations 1</xref>&#x2013;<xref ref-type="disp-formula" rid="eq3">3</xref>, respectively:</p>
<disp-formula id="eq1">
<label>(1)</label>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:msup>
<mml:mtext>R</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mtext>i</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mtext>n</mml:mtext>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mtext>x</mml:mtext>
<mml:mtext>i</mml:mtext>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mtext>y</mml:mtext>
<mml:mtext>i</mml:mtext>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:msubsup>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mtext>i</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mtext>n</mml:mtext>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mtext>x</mml:mtext>
<mml:mtext>i</mml:mtext>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>x</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq2">
<label>(2)</label>
<mml:math display="block" id="M2">
<mml:mrow>
<mml:mtext>RMSE</mml:mtext>
<mml:mo>=</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mtext>i</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mtext>n</mml:mtext>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mtext>y</mml:mtext>
<mml:mtext>i</mml:mtext>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mtext>x</mml:mtext>
<mml:mtext>i</mml:mtext>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mtext>n</mml:mtext>
</mml:mfrac>
<mml:mtext>&#xa0;</mml:mtext>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq3">
<label>(3)</label>
<mml:math display="block" id="M3">
<mml:mrow>
<mml:mtext>MAE</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mtext>i</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mtext>n</mml:mtext>
</mml:msubsup>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mtext>y</mml:mtext>
<mml:mtext>i</mml:mtext>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mtext>x</mml:mtext>
<mml:mtext>i</mml:mtext>
</mml:msub>
</mml:mrow>
<mml:mo>|</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mtext>n</mml:mtext>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Note: <inline-formula>
<mml:math display="inline" id="im1">
<mml:mrow>
<mml:msub>
<mml:mtext>x</mml:mtext>
<mml:mtext>i</mml:mtext>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula>
<mml:math display="inline" id="im2">
<mml:mrow>
<mml:msub>
<mml:mtext>y</mml:mtext>
<mml:mtext>i</mml:mtext>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula>
<mml:math display="inline" id="im3">
<mml:mover accent="true">
<mml:mi>x</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:math>
</inline-formula> are the actual measured value, predicted value and average value of the measured data, respectively; n is the number of samples.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<p>SG smoothing was applied to the spectral curves within the 400 to 900 nm range, The processing results of OS, FD and SD at different growth stages are shown in <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Derivative transformation spectral curves of rice canopy at different growth stages. <bold>(A)</bold> original spectrum, <bold>(B)</bold> first derivative spectrum, <bold>(C)</bold> second derivative spectrum.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1396183-g002.tif"/>
</fig>
<p>The processing results for the OS reveal the characteristic spectral profile of the rice canopy, marked by typical green plant reflectance features, with spectral reflectance values ranging from 0 to 0.5. Notably, a reflection peak and an absorption valley are observed near wavelengths of 550 nm and 680 nm, respectively, both of which are situated within the visible light spectrum. The spectral reflectance of rice rapidly increases within the 680 to 750 nm range, creating a &#x201c;red edge&#x201d; phenomenon (<xref ref-type="bibr" rid="B25">Gitelson et&#xa0;al., 1996</xref>). The first peak of the FD curve appears at 500 ~ 550 nm. The band range of 680 ~ 750 nm shows a drastic change that first rises and then falls. The SD curve exhibits continuous fluctuations across the 500 to 690 nm band range, with two notable peaks within the 700 to 800 nm band range.</p>
<sec id="s3_1">
<label>3.1</label>
<title>Correlations between different orders of derivative spectrum and rice AGB</title>
<p>To fully explore the sensitivity of the different orders of rice canopy spectra and to compare the effects of spectral transformations on AGB, FD and SD transformations were carried out on the basis of OS, and their correlations with rice AGB were investigated (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>).</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Correlation between rice canopy spectra and AGB at different growth stages. <bold>(A-E)</bold> The correlation between OS and AGB; <bold>(F-J)</bold> the correlation between FD and AGB; <bold>(K-O)</bold> the correlation between SD and AGB.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1396183-g003.tif"/>
</fig>
<p>During the full growth stage, the correlation between OS and AGB showed a consistent trend from negative to positive as the band increased, with the maximum correlation at 720 nm. The correlation curve between FD and AGB shows a continuous fluctuation trend in the 400 ~ 900 nm band, among which the 680 ~ 750 nm band has the highest correlation, with a correlation coefficient between 0.60 ~ 0.85. The correlation curve between SD and AGB was similar to that between FD and AGB, but the fluctuations were more severe.</p>
<p>In summary, the derivative spectrum of the different orders were compared with the maximum absolute value of the AGB correlation coefficient (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>). Except for the tillering stage, the maximum values in the other four periods all occurred at FD. Comprehensive analysis revealed that the FD could better reflect the growth status of rice, so the FD was used as the input variable of the feature screening algorithm for subsequent construction of the AGB estimation model.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>The maximum absolute value of the correlation coefficient between different order derivative spectra and AGB.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1396183-g004.tif"/>
</fig>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Feature band selection</title>
<p>An AGB estimation model utilizing PLSR, PCR, SVM, and RR was developed to evaluate the effectiveness of the band screening algorithms. This model incorporated characteristic bands selected by both the Boruta algorithm and the RFE algorithm, as well as the full band as input variables. The diversity and scope of the characteristic bands selected by these feature screening algorithms during different growth stages are summarized in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>. Detailed feature selection results are shown in <xref ref-type="supplementary-material" rid="SM1">
<bold>Appendix 2</bold>
</xref>.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Comparison of feature selection results between the Boruta algorithm and RFE algorithm.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Feature selection algorithm</th>
<th valign="middle" align="center">Growth<break/>Stage</th>
<th valign="middle" align="center">Number</th>
<th valign="middle" align="center">Feature band range (nm)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="5" align="center">Boruta</td>
<td valign="middle" align="left">Tillering</td>
<td valign="top" align="center">19</td>
<td valign="top" align="center">724 ~ 761</td>
</tr>
<tr>
<td valign="middle" align="center">Jointing</td>
<td valign="top" align="center">35</td>
<td valign="top" align="center">644, 721 ~ 771, 816, 817</td>
</tr>
<tr>
<td valign="middle" align="center">Booting</td>
<td valign="top" align="center">27</td>
<td valign="top" align="center">664 ~ 694, 717 ~ 774</td>
</tr>
<tr>
<td valign="middle" align="center">Heading</td>
<td valign="top" align="center">24</td>
<td valign="top" align="center">414, 416, 699 ~ 777,817, 873</td>
</tr>
<tr>
<td valign="top" align="center">Maturity</td>
<td valign="top" align="center">30</td>
<td valign="top" align="center">420, 498, 686 ~ 759, 842</td>
</tr>
<tr>
<td valign="middle" rowspan="5" align="center">RFE</td>
<td valign="middle" align="left">Tillering</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">742, 751, 761</td>
</tr>
<tr>
<td valign="middle" align="center">Jointing</td>
<td valign="top" align="center">392</td>
<td valign="top" align="center">402 ~ 900</td>
</tr>
<tr>
<td valign="middle" align="center">Booting</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">753, 754, 764</td>
</tr>
<tr>
<td valign="middle" align="center">Heading</td>
<td valign="top" align="center">127</td>
<td valign="top" align="left">402 ~ 495, 507 ~ 594, 614 ~ 699, 702 ~ 900</td>
</tr>
<tr>
<td valign="top" align="center">Maturity</td>
<td valign="top" align="center">439</td>
<td valign="top" align="center">400 ~ 900</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The Boruta algorithm demonstrated remarkable stability, with the number of characteristic wavelengths in each growth stage not exceeding 40. In contrast, the RFE algorithm showed more significant fluctuations, with 3 characteristic wavelengths identified at both the tillering and booting stages and 439 at the maturity stage, indicating substantial variance in the number of wavelengths identified across different growth stages. Notably, the characteristic wavelengths identified by both screening algorithms predominantly fall within the &#x201c;red edge&#x201d; spectral range, highlighting their importance in estimating rice AGB.</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Establishment and evaluation of the rice AGB estimation model based on FD</title>
<p>This study employs three types of model input variables: first derivative full band (FD-FB), the characteristic bands selected by the Boruta algorithm (FD-Boruta), and the characteristic bands selected by the RFE algorithm (FD-RFE). Sixty AGB estimation models were developed for various growth stages using four machine learning algorithms (PLSR, PCR, SVM, RR), with R&#xb2; (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>), RMSE (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>) and MAE (<xref ref-type="supplementary-material" rid="SM1">
<bold>Appendix 1</bold>
</xref>) serving as the model evaluation metrics.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Comparison of the R&#xb2; values of the different estimation models for the validation sets. PLSR, partial least squares regression; PCR, principal component regression; SVM, support vector machine; RR, ridge regression.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1396183-g005.tif"/>
</fig>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Rice AGB estimation model under different machine learning algorithms (R<sup>2</sup>, RMSE).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" rowspan="3" align="left">machine learning algorithm</th>
<th valign="top" rowspan="3" align="center">Bandselection algorithm</th>
<th valign="top" colspan="4" align="center">Tillering</th>
<th valign="top" colspan="4" align="center">Jointing</th>
<th valign="top" colspan="4" align="center">Booting</th>
<th valign="top" colspan="4" align="center">Heading</th>
<th valign="top" colspan="4" align="center">Maturity</th>
</tr>
<tr>
<th valign="top" colspan="2" align="center">Modeling Set</th>
<th valign="top" colspan="2" align="center">Validation Set</th>
<th valign="top" colspan="2" align="center">Modeling Set</th>
<th valign="top" colspan="2" align="center">Validation Set</th>
<th valign="top" colspan="2" align="center">Modeling Set</th>
<th valign="top" colspan="2" align="center">Validation Set</th>
<th valign="top" colspan="2" align="center">Modeling Set</th>
<th valign="top" colspan="2" align="center">ValidationSet</th>
<th valign="top" colspan="2" align="center">Modeling Set</th>
<th valign="top" colspan="2" align="center">Validation Set</th>
</tr>
<tr>
<th valign="top" align="center">R&#xb2;</th>
<th valign="top" align="center">RMSE(kg/hm&#xb2;)</th>
<th valign="top" align="center">R&#xb2;</th>
<th valign="top" align="center">RMSE(kg/hm&#xb2;)</th>
<th valign="top" align="center">R&#xb2;</th>
<th valign="top" align="center">RMSE(kg/hm&#xb2;)</th>
<th valign="top" align="center">R&#xb2;</th>
<th valign="top" align="center">RMSE(kg/hm&#xb2;)</th>
<th valign="top" align="center">R&#xb2;</th>
<th valign="top" align="center">RMSE(kg/hm&#xb2;)</th>
<th valign="top" align="center">R&#xb2;</th>
<th valign="top" align="center">RMSE(kg/hm&#xb2;)</th>
<th valign="top" align="center">R&#xb2;</th>
<th valign="top" align="center">RMSE(kg/hm&#xb2;)</th>
<th valign="top" align="center">R&#xb2;</th>
<th valign="top" align="center">RMSE(kg/hm&#xb2;)</th>
<th valign="top" align="center">R&#xb2;</th>
<th valign="top" align="center">RMSE(kg/hm&#xb2;)</th>
<th valign="top" align="center">R&#xb2;</th>
<th valign="top" align="center">RMSE(kg/hm&#xb2;)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" rowspan="3" align="left">PLSR</td>
<td valign="top" align="left">Boruta</td>
<td valign="top" align="left">0.54</td>
<td valign="top" align="left">427.85</td>
<td valign="top" align="left">0.61</td>
<td valign="top" align="left">464.34</td>
<td valign="top" align="left">0.68</td>
<td valign="top" align="left">801.67</td>
<td valign="top" align="left">0.57</td>
<td valign="top" align="left">1072.49</td>
<td valign="top" align="left">0.72</td>
<td valign="top" align="left">1096.66</td>
<td valign="top" align="left">0.70</td>
<td valign="top" align="left">1351.62</td>
<td valign="top" align="left">0.72</td>
<td valign="top" align="left">1125.80</td>
<td valign="top" align="left">0.67</td>
<td valign="top" align="left">1405.25</td>
<td valign="top" align="left">0.49</td>
<td valign="top" align="left">2017.00</td>
<td valign="top" align="left">0.43</td>
<td valign="top" align="left">2515.77</td>
</tr>
<tr>
<td valign="top" align="left">RFE</td>
<td valign="top" align="left">0.53</td>
<td valign="top" align="left">434.66</td>
<td valign="top" align="left">0.57</td>
<td valign="top" align="left">493.81</td>
<td valign="top" align="left">0.78</td>
<td valign="top" align="left">635.91</td>
<td valign="top" align="left">0.47</td>
<td valign="top" align="left">1226.82</td>
<td valign="top" align="left">0.70</td>
<td valign="top" align="left">1148.63</td>
<td valign="top" align="left">0.70</td>
<td valign="top" align="left">1336.75</td>
<td valign="top" align="left">0.80</td>
<td valign="top" align="left">908.01</td>
<td valign="top" align="left">0.67</td>
<td valign="top" align="left">1398.94</td>
<td valign="top" align="left">0.63</td>
<td valign="top" align="left">1736.85</td>
<td valign="top" align="left">0.43</td>
<td valign="top" align="left">2407.61</td>
</tr>
<tr>
<td valign="top" align="left">FB</td>
<td valign="top" align="left">0.72</td>
<td valign="top" align="left">324.48</td>
<td valign="top" align="left">0.59</td>
<td valign="top" align="left">473.29</td>
<td valign="top" align="left">0.77</td>
<td valign="top" align="left">644.07</td>
<td valign="top" align="left">0.46</td>
<td valign="top" align="left">1245.08</td>
<td valign="top" align="left">0.81</td>
<td valign="top" align="left">912.34</td>
<td valign="top" align="left">0.64</td>
<td valign="top" align="left">1474.44</td>
<td valign="top" align="left">0.79</td>
<td valign="top" align="left">948.73</td>
<td valign="top" align="left">0.60</td>
<td valign="top" align="left">1547.85</td>
<td valign="top" align="left">0.63</td>
<td valign="top" align="left">1744.52</td>
<td valign="top" align="left">0.43</td>
<td valign="top" align="left">2406.05</td>
</tr>
<tr>
<td valign="top" rowspan="3" align="left">PCR</td>
<td valign="top" align="left">Boruta</td>
<td valign="top" align="left">0.54</td>
<td valign="top" align="left">427.33</td>
<td valign="top" align="left">0.60</td>
<td valign="top" align="left">469.15</td>
<td valign="top" align="left">0.64</td>
<td valign="top" align="left">853.54</td>
<td valign="top" align="left">0.60</td>
<td valign="top" align="left">1057.88</td>
<td valign="top" align="left">0.72</td>
<td valign="top" align="left">1101.43</td>
<td valign="top" align="left">0.72</td>
<td valign="top" align="left">1290.24</td>
<td valign="top" align="left">0.70</td>
<td valign="top" align="left">1171.49</td>
<td valign="top" align="left">0.71</td>
<td valign="top" align="left">1307.01</td>
<td valign="top" align="left">0.45</td>
<td valign="top" align="left">2120.01</td>
<td valign="top" align="left">0.45</td>
<td valign="top" align="left">2392.65</td>
</tr>
<tr>
<td valign="top" align="left">RFE</td>
<td valign="top" align="left">0.53</td>
<td valign="top" align="left">435.68</td>
<td valign="top" align="left">0.57</td>
<td valign="top" align="left">493.77</td>
<td valign="top" align="left">0.43</td>
<td valign="top" align="left">1067.73</td>
<td valign="top" align="left">0.41</td>
<td valign="top" align="left">1311.00</td>
<td valign="top" align="left">0.70</td>
<td valign="top" align="left">1150.33</td>
<td valign="top" align="left">0.70</td>
<td valign="top" align="left">1338.99</td>
<td valign="top" align="left">0.70</td>
<td valign="top" align="left">1180.64</td>
<td valign="top" align="left">0.70</td>
<td valign="top" align="left">1321.14</td>
<td valign="top" align="left">0.43</td>
<td valign="top" align="left">2178.91</td>
<td valign="top" align="left">0.41</td>
<td valign="top" align="left">2412.86</td>
</tr>
<tr>
<td valign="top" align="left">FB</td>
<td valign="top" align="left">0.55</td>
<td valign="top" align="left">423.94</td>
<td valign="top" align="left">0.61</td>
<td valign="top" align="left">477.47</td>
<td valign="top" align="left">0.41</td>
<td valign="top" align="left">1087.71</td>
<td valign="top" align="left">0.39</td>
<td valign="top" align="left">1332.82</td>
<td valign="top" align="left">0.68</td>
<td valign="top" align="left">1186.97</td>
<td valign="top" align="left">0.65</td>
<td valign="top" align="left">1465.01</td>
<td valign="top" align="left">0.59</td>
<td valign="top" align="left">1377.74</td>
<td valign="top" align="left">0.63</td>
<td valign="top" align="left">1541.66</td>
<td valign="top" align="left">0.41</td>
<td valign="top" align="left">2205.87</td>
<td valign="top" align="left">0.40</td>
<td valign="top" align="left">2430.66</td>
</tr>
<tr>
<td valign="top" rowspan="3" align="left">SVM</td>
<td valign="top" align="left">Boruta</td>
<td valign="top" align="left">0.67</td>
<td valign="top" align="left">368.29</td>
<td valign="top" align="left">0.66</td>
<td valign="top" align="left">434.33</td>
<td valign="top" align="left">0.80</td>
<td valign="top" align="left">663.56</td>
<td valign="top" align="left">0.65</td>
<td valign="top" align="left">985.55</td>
<td valign="top" align="left">0.86</td>
<td valign="top" align="left">800.08</td>
<td valign="top" align="left">0.71</td>
<td valign="top" align="left">1349.87</td>
<td valign="top" align="left">0.82</td>
<td valign="top" align="left">902.99</td>
<td valign="top" align="left">0.66</td>
<td valign="top" align="left">1411.43</td>
<td valign="top" align="left">0.85</td>
<td valign="top" align="left">1135.73</td>
<td valign="top" align="left">0.52</td>
<td valign="top" align="left">2189.95</td>
</tr>
<tr>
<td valign="top" align="left">RFE</td>
<td valign="top" align="left">0.67</td>
<td valign="top" align="left">367.30</td>
<td valign="top" align="left">0.65</td>
<td valign="top" align="left">445.05</td>
<td valign="top" align="left">0.97</td>
<td valign="top" align="left">329.32</td>
<td valign="top" align="left">0.35</td>
<td valign="top" align="left">1370.60</td>
<td valign="top" align="left">0.75</td>
<td valign="top" align="left">1073.13</td>
<td valign="top" align="left">0.74</td>
<td valign="top" align="left">1311.04</td>
<td valign="top" align="left">0.99</td>
<td valign="top" align="left">216.76</td>
<td valign="top" align="left">0.70</td>
<td valign="top" align="left">1430.80</td>
<td valign="top" align="left">0.96</td>
<td valign="top" align="left">716.15</td>
<td valign="top" align="left">0.22</td>
<td valign="top" align="left">2964.74</td>
</tr>
<tr>
<td valign="top" align="left">FB</td>
<td valign="top" align="left">0.80</td>
<td valign="top" align="left">481.27</td>
<td valign="top" align="left">0.27</td>
<td valign="top" align="left">701.52</td>
<td valign="top" align="left">0.98</td>
<td valign="top" align="left">276.86</td>
<td valign="top" align="left">0.32</td>
<td valign="top" align="left">1412.37</td>
<td valign="top" align="left">0.97</td>
<td valign="top" align="left">486.02</td>
<td valign="top" align="left">0.19</td>
<td valign="top" align="left">2316.48</td>
<td valign="top" align="left">0.98</td>
<td valign="top" align="left">386.45</td>
<td valign="top" align="left">0.30</td>
<td valign="top" align="left">2266.78</td>
<td valign="top" align="left">0.95</td>
<td valign="top" align="left">852.86</td>
<td valign="top" align="left">0.19</td>
<td valign="top" align="left">2980.00</td>
</tr>
<tr>
<td valign="top" rowspan="3" align="left">RR</td>
<td valign="top" align="left">Boruta</td>
<td valign="top" align="left">0.58</td>
<td valign="top" align="left">421.84</td>
<td valign="top" align="left">0.60</td>
<td valign="top" align="left">504.74</td>
<td valign="top" align="left">0.72</td>
<td valign="top" align="left">764.35</td>
<td valign="top" align="left">0.62</td>
<td valign="top" align="left">1009.78</td>
<td valign="top" align="left">0.76</td>
<td valign="top" align="left">1036.43</td>
<td valign="top" align="left">0.71</td>
<td valign="top" align="left">1301.00</td>
<td valign="top" align="left">0.81</td>
<td valign="top" align="left">955.61</td>
<td valign="top" align="left">0.68</td>
<td valign="top" align="left">1370.52</td>
<td valign="top" align="left">0.63</td>
<td valign="top" align="left">1827.13</td>
<td valign="top" align="left">0.53</td>
<td valign="top" align="left">2217.62</td>
</tr>
<tr>
<td valign="top" align="left">RFE</td>
<td valign="top" align="left">0.53</td>
<td valign="top" align="left">435.50</td>
<td valign="top" align="left">0.55</td>
<td valign="top" align="left">513.04</td>
<td valign="top" align="left">0.90</td>
<td valign="top" align="left">513.16</td>
<td valign="top" align="left">0.53</td>
<td valign="top" align="left">1120.75</td>
<td valign="top" align="left">0.70</td>
<td valign="top" align="left">1144.30</td>
<td valign="top" align="left">0.72</td>
<td valign="top" align="left">1288.23</td>
<td valign="top" align="left">0.94</td>
<td valign="top" align="left">579.73</td>
<td valign="top" align="left">0.70</td>
<td valign="top" align="left">1318.70</td>
<td valign="top" align="left">0.91</td>
<td valign="top" align="left">1102.65</td>
<td valign="top" align="left">0.32</td>
<td valign="top" align="left">2628.54</td>
</tr>
<tr>
<td valign="top" align="left">FB</td>
<td valign="top" align="left">0.95</td>
<td valign="top" align="left">192.63</td>
<td valign="top" align="left">0.46</td>
<td valign="top" align="left">514.86</td>
<td valign="top" align="left">0.90</td>
<td valign="top" align="left">518.87</td>
<td valign="top" align="left">0.50</td>
<td valign="top" align="left">1160.32</td>
<td valign="top" align="left">0.94</td>
<td valign="top" align="left">627.07</td>
<td valign="top" align="left">0.60</td>
<td valign="top" align="left">1554.82</td>
<td valign="top" align="left">0.95</td>
<td valign="top" align="left">612.77</td>
<td valign="top" align="left">0.57</td>
<td valign="top" align="left">1588.79</td>
<td valign="top" align="left">0.92</td>
<td valign="top" align="left">1095.07</td>
<td valign="top" align="left">0.29</td>
<td valign="top" align="left">2648.03</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>PLSR, partial least squares regression; PCR, principal component regression; SVM, support vector machine; RR, ridge regression.</p>
</table-wrap-foot>
</table-wrap>
<p>Initially, the AGB estimation abilities of different feature selection algorithms were compared within the same model framework. In the PLSR model, the estimation precision for FD-Boruta and FD-RFE was found to be comparable, with R&#xb2; values ranging from 0.43 to 0.70, and RMSE values between 464.34 and 2515.77 kg/hm&#xb2; and 493.81 and 2407.61 kg/hm&#xb2;, respectively. These results are more accurate than those obtained using FD-FB, with R&#xb2; values improving by 0 to 0.06 and RMSE values decreasing by 29.47 to 148.91 kg/hm&#xb2;. Among the PCR models, FD-Boruta exhibited the highest estimation accuracy, followed by FD-RFE, with FD-FB showing the least accuracy. The R&#xb2; accuracy of FD-Boruta improved by 0.03, 0.19, 0.02, 0.01, and 0.04, respectively, compared to FD-RFE. In contrast, the R&#xb2; accuracy of FD-RFE improved by 0.02, 0.05, 0.07, and 0.01 compared to FD-FB. The outcomes for the SVM and RR models were analogous, although the performances of the three algorithms varied significantly. R&#xb2; ranged from 0.58 to 0.71 for FD-Boruta, 0.22 to 0.74 for FD-RFE, and 0.19 to 0.60 for FD-FB.</p>
<p>Second, the estimation accuracy of AGB by different models under the same feature selection algorithm was compared. For the model constructed with FD-Boruta inputs, when the estimation accuracy was similar, FD-Boruta-PCR demonstrated more stable performance. The estimation outcomes of models based on FD-RFE varied significantly. FD-RFE-PLSR and FD-RFE-PCR provided more precise estimates of rice AGB, whereas the FD-RFE-SVM and FD-RFE-RR models exhibited overfitting in certain stages. The models based on FD-RFE generally showed poor performance, with model R&#xb2; values below 0.65, and the accuracy of the FD-FB-SVM and FD-FB-RR models varied greatly.</p>
<p>Finally, the performance of all model combinations was assessed for estimating AGB effects across different growth stages. In the tillering stage, FD-Boruta-SVM yielded the best estimation, with an R&#xb2; of 0.66 and an RMSE of 34.33 kg/hm&#xb2;. During the jointing stage, FD-Boruta-SVM achieved the highest estimation accuracy, with an R&#xb2; of 0.65 and an RMSE of 985.55 kg/hm&#xb2;, while FD-FB-SVM showed the lowest accuracy, with an R&#xb2; of 0.32 and an RMSE of 1412.37 kg/hm2. In the booting stage, the estimation accuracies R&#xb2; of models using FD-FB and FD-RFE inputs were both above 0.7, with FD-RFE-SVM and FD-Boruta-PCR performing the best, achieving R&#xb2; values of 0.74 and 0.72, respectively, and RMSE values of 1311.04 kg/hm&#xb2; and 1290.24 kg/hm&#xb2;, respectively. At the heading stage, FD-Boruta-PCR had the highest estimation accuracy, with an R&#xb2; of 0.71, while FD-FB-SVM had the lowest accuracy, with an R&#xb2; of 0.30. In the maturity stage, the AGB estimation accuracy of all the models decreased, with R&#xb2; values ranging from 0.19 to 0.53.</p>
<p>In conclusion, models built using the Boruta algorithm are more reliable and exhibit greater stability, among which FD-Boruta-PCR is the most stable, followed by FD-Boruta-PLSR. Considering the model estimation accuracy, the booting period is the most accurately estimated, with R&#xb2; values exceeding 0.7.</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<sec id="s4_1">
<label>4.1</label>
<title>Correlations between OS, FD, SD and AGB</title>
<p>An in-depth analysis of the correlation between spectral information and AGB will facilitate a comprehensive understanding of the growth status of rice. This study performed a correlation analysis between different orders of derivative spectrum and AGB at different growth stages of rice. Generally, the correlation between the derivative spectrum of various orders and AGB tended to increase and then decrease throughout the growth stage, potentially due to the influence of the rice growth cycle (<xref ref-type="bibr" rid="B72">Xu et&#xa0;al., 2023</xref>). From the tillering stage to heading stage, as the chlorophyll content in rice leaves increases and the vegetation canopy structure becomes fully developed, the canopy becomes richer in spectral information, which can more accurately reflect crop characteristics (<xref ref-type="bibr" rid="B55">Ren et&#xa0;al., 2018</xref>). In the mature stage, as stems and leaves progressively wither and yellow, the chlorophyll content drops sharply, the spectral characteristics obtained are less able to accurately represent crop growth, leading to a decrease in the correlation between the canopy spectrum and AGB (<xref ref-type="bibr" rid="B74">Yang and Chen, 2004</xref>; <xref ref-type="bibr" rid="B29">He et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B82">Zhang et&#xa0;al., 2019</xref>).</p>
<p>Within the 680~750 nm band range, the correlation between the canopy spectrum and AGB reached its maximum value in different stages (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>). This occurs because this band serves as the transition region between the infrared and near-infrared bands, where spectral reflectance transitions rapidly from a low negative correlation to a high positive correlation. This shift is attributed to strong absorption and reflection (<xref ref-type="bibr" rid="B35">Kanke et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B73">Xu et&#xa0;al., 2022</xref>). The correlation between FD and AGB was generally greater than that between OS and SD at the different fertility stages (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>). This observation aligns with the findings of <xref ref-type="bibr" rid="B44">Liang et&#xa0;al. (2018)</xref> and <xref ref-type="bibr" rid="B68">Tong et&#xa0;al. (2023)</xref>. As a method for analyzing spectral information, derivative transform can diminish noise and enhance data accuracy (<xref ref-type="bibr" rid="B43">Li and Xie, 2015</xref>). FD reflects the slope of the spectrum, while SD represents the change in the slope of the reflection spectrum. While SD identifies more absorption peaks, it also introduces noise and may result in errors (<xref ref-type="bibr" rid="B60">Shen et&#xa0;al., 2022</xref>). Therefore, FD is strongly correlated with AGB and can be effectively utilized for estimating rice AGB.</p>
</sec>
<sec id="s4_2">
<label>4.2</label>
<title>Rice AGB estimation based on different feature selection algorithms</title>
<p>In the realm of feature selection, prior research has demonstrated that employing screened feature variables for model construction enhances the estimation power, inversion accuracy, and utility of the original models (<xref ref-type="bibr" rid="B22">Gao et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B64">Sun et&#xa0;al., 2021</xref>). For example, <xref ref-type="bibr" rid="B79">Yu et&#xa0;al. (2023)</xref> used the SPA algorithm to extract sensitive bands in rice canopy spectral data, and combined with PROSAIL to establish a rice AGB estimation model, achieving high accuracy (R&#xb2;=0.69). This study yielded similar findings, the characteristic band had a greater estimation ability than the original band. The difference is that previous research is usually based on OS and does not involve derivative transform. Therefore, whether the estimation model constructed by derivative transformed spectrum is better than OS remains to be determined. This study performs SG smoothing and derivative transform on OS and selects characteristic bands based on the optimal derivative spectrum. The results show that the Boruta algorithm is more robust than the RFE algorithm, and the selected feature bands are more sensitive, which is conducive to constructing subsequent rice AGB estimation model.</p>
<p>Under identical conditions, the most accurate AGB estimates were achieved using feature bands selected by the Boruta algorithm. This superiority of the Boruta algorithm is attributed to its ability to identify bands of features that are genuinely relevant to the dependent variable, thereby enhancing the prediction accuracy of the model (<xref ref-type="bibr" rid="B41">Kursa and Rudnicki, 2010</xref>), a conclusion that aligns with the findings of <xref ref-type="bibr" rid="B14">Degenhardt et&#xa0;al. (2019)</xref>. However, the RFE algorithm exhibited suboptimal performance in the jointing, heading, and maturity stages. This could be due to the RFE algorithm generates feature subsets with corresponding accuracy by continuously building models. This process may result in retaining a large number of features, leading to significant collinearity between bands and diminishing the model&#x2019;s estimation accuracy (<xref ref-type="bibr" rid="B51">Paul et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B8">Chen et&#xa0;al., 2018</xref>), echoing the research results of <xref ref-type="bibr" rid="B45">Lin et&#xa0;al. (2023)</xref>. The poorest performance was observed when the entire band was utilized as an input variable, attributed to the presence of redundant information and increased collinearity among bands, which impaired the model&#x2019;s estimation capability (<xref ref-type="bibr" rid="B28">Hansen and Schjoerring, 2003</xref>; <xref ref-type="bibr" rid="B50">Pan et&#xa0;al., 2017</xref>).</p>
<p>Compared with the RFE algorithm, the Boruta algorithm identified fewer feature bands (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>); however, the resulting estimation model was more stable. This stability may be due to the characteristic bands determined by the Boruta algorithm being more effective and independent (<xref ref-type="bibr" rid="B52">Poona et&#xa0;al., 2016</xref>). Additionally, when comparing feature bands screened by both the Boruta and RFE algorithms, it was noted that their intersection predominantly occurred in the &#x201c;red edge&#x201d; region. This could be due to the band encapsulates rich crop information and is highly correlated with AGB (<xref ref-type="bibr" rid="B31">Horler et&#xa0;al., 1983</xref>; <xref ref-type="bibr" rid="B18">Filella and Penuelas, 1994</xref>), consistent with the findings of <xref ref-type="bibr" rid="B10">Cheng et&#xa0;al. (2017)</xref>, who assessed the estimation effects of eight vegetation indices on rice canopy composition AGB and found the red edge index to be particularly sensitive to leaf AGB, achieving the highest estimation accuracy.</p>
<p>Another aspect of interest is that the characteristic bands identified by the Boruta algorithm, which are relatively evenly distributed across the spectrum, are predominantly found at wavelengths of 420 nm, 644 nm, 750 nm, and 842 nm. These characteristic bands are mainly located in areas sensitive to crop AGB response and are relatively evenly distributed. During the tillering stage, the characteristic bands are primarily located in the &#x201c;red edge&#x201d; region, which may be due to the low vegetation coverage at this time and the spectrum response is not obvious (<xref ref-type="bibr" rid="B38">Kokaly and Clark, 1999</xref>; <xref ref-type="bibr" rid="B12">Clevers et&#xa0;al., 2001</xref>). In the jointing stage, characteristic wavelengths are observed in the near-infrared region, likely due to the increase in rice canopy biomass, making the wavelength response in this region more pronounced and easier to detect during the selection process (<xref ref-type="bibr" rid="B13">Datt, 1998</xref>). From the heading to the maturity stage, a few characteristic wavelengths in the blue light region are identified, possibly because the chlorophyll content in the leaves gradually decreases, leading to increased spectral reflectance in the blue light region (<xref ref-type="bibr" rid="B77">Yan-lin et&#xa0;al., 2004</xref>). Thus, the Boruta algorithm effectively mines the spectral information of the rice canopy, and the selected characteristic bands align with the spectral response changes in the rice canopy, thereby enhancing the accuracy of AGB estimation.</p>
</sec>
<sec id="s4_3">
<label>4.3</label>
<title>Rice AGB estimation based on different machine learning algorithms</title>
<p>The performances of various models were meticulously compared, with the PCR model emerging as the most reliable and stable for estimating AGB. The differences between the R<sup>2</sup> values for the modeling set and the validation set are minimal, ranging from 0 to 0.1. Both the RMSE and MAE are lower for the PCR model than for the other models. This superior performance of the PCR model can be attributed to its foundation in predictive data mining technology through principal component analysis (PCA), which efficiently reduces the dimensionality of independent variables, mitigates the effects of multicollinearity among variables, and enhances the model&#x2019;s adaptability (<xref ref-type="bibr" rid="B65">Suryakala and Prince, 2019</xref>). In the PLSR model. Models constructed with three different input variables all demonstrated the ability to estimate rice AGB, particularly at the booting stage, when the R&#xb2; of the validation set exceeded 0.6. This performance is likely due to the robust adaptability of the PLSR algorithm, its ability to diminish the dimensionality of spectral data, its ability to effectively handle complex collinear relationships between independent variables, and its overall enhancement of the model&#x2019;s estimation accuracy (<xref ref-type="bibr" rid="B30">Helland, 2001</xref>). In the SVM model, estimation models built on FD-RFE and FD-FB inputs exhibited overfitting at the jointing, heading, and maturity stages. Due to the excessive number of FD-RFE and FD-FB, when fitting as sample data, the noise interference in the model is large, resulting in an increase in estimation error. Even some noise may be recognized as characteristic frequency bands by machine learning algorithms, destroying the preset classification rules and significantly affecting the accuracy of model estimation (<xref ref-type="bibr" rid="B11">Cherkassky, 1997</xref>; <xref ref-type="bibr" rid="B59">Shafaei and Kisi, 2017</xref>; <xref ref-type="bibr" rid="B54">Raja et&#xa0;al., 2022</xref>). FD-Boruta has a small number but high estimation potential and can solve collinearity problems well when combined with the SVM algorithm. Similar outcomes were also observed in the RR model. This may be because the RR algorithm cannot automatically select important feature variables when fitting sample data. Therefore, when the amount of input sample data is large, it is easily affected by outliers, thereby reducing the model&#x2019;s predictive ability. It may also be that because determining optimal ridge parameters is critical when building an estimation model, poor parameter selection can lead to overfitting of the model, thereby reducing its interpretability (<xref ref-type="bibr" rid="B62">Smith and Campbell, 1980</xref>; <xref ref-type="bibr" rid="B19">Forrester and Kalivas, 2004</xref>). Moreover, this study demonstrates that the model achieves the highest estimation accuracy during the booting stage. This can be ascribed to the booting stage, which is the primary period for increases in rice chlorophyll and is characterized by high vegetation coverage and the absence of panicles. At this juncture, noise interference is minimized, and the spectral information collected is purer and more precise, providing advantageous conditions for estimating rice AGB (<xref ref-type="bibr" rid="B7">Chang et&#xa0;al., 2005</xref>; <xref ref-type="bibr" rid="B67">Takai et&#xa0;al., 2006</xref>; <xref ref-type="bibr" rid="B36">Kawamura et&#xa0;al., 2018</xref>).</p>
</sec>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusion</title>
<p>This study implements SG smoothing and derivative transform for the preprocessing of spectral data, aiming to diminish fluctuations and noise interference. Subsequently, the Boruta and RFE algorithms are applied to select features from the first-order spectrum, thereby reducing the data dimensions and information redundancy and enhancing the data accuracy. A rice AGB estimation model was developed from the tillering stage to the maturity stage by integrating PLSR, PCR, SVM, and ridge regression machine learning algorithms. The key findings of the research are as follows:</p>
<list list-type="simple">
<list-item>
<p>(1) Except during the booting stage, FD exhibited the strongest correlation with AGB across the other four growth stages, followed by OS and then SD. As the rice growth stage progresses, the correlation shows a trend of first increasing and then decreasing.</p>
</list-item>
<list-item>
<p>(2) The performance of the Boruta algorithm is more stable, the selected characteristic bands are more sensitive, and effective dimensionality reduction of spectrum data is achieved. The number of feature strips provided by the RFE algorithm ranges from 3 to 439, and the number of feature strips selected by the Boruta algorithm is within 40.</p>
</list-item>
<list-item>
<p>(3) Among all model combinations, the characteristic band selected by the Boruta algorithm performs best, and FD-Boruta-PCR emerged as the superior model for estimating rice AGB, with R&#xb2; values between 0.45 and 0.72 and RMSE values between 469.15 and 2392.65 kg/hm&#xb2;. The worst performing model is the FD-FB-SVM model, with R&#xb2; values between 0.19 and 0.32 and RMSE values between 701.52 and 2980.00 kg/hm&#xb2;.</p>
</list-item>
<list-item>
<p>(4) As the progression from the tillering stage to the mature stage occurs, the accuracy of the AGB estimation model decreases. Among them, the booting stage was determined to be the most accurate prediction stage, as evidenced by an R&#xb2; of 0.72 and an RMSE of 1290.24 kg/hm&#xb2;.</p>
</list-item>
</list>
</sec>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. Further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>YN: Conceptualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing, Data curation, Formal Analysis. XS: Writing &#x2013; review &amp; editing. HY: Investigation, Writing &#x2013; review &amp; editing. YZ: Methodology, Supervision, Writing &#x2013; review &amp; editing. JL: Formal Analysis, Writing &#x2013; review &amp; editing. WW: Project administration, Writing &#x2013; review &amp; editing. YS: Validation, Writing &#x2013; review &amp; editing. QM: Visualization, Writing &#x2013; review &amp; editing. JKL: Resources, Writing &#x2013; review &amp; editing. XL: Funding acquisition, Writing &#x2013; review &amp; editing.</p>
</sec>
</body>
<back>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. This research was funded by Scientific research projects in higher education institutions of Anhui Province (no. 2023AH051855; 2022AH051623); Anhui Province Crop Intelligent Planting and Processing Technology Engineering Research Center Open Research Project (no. ZHKF202303); Natural Science Foundation of Hebei Province (no. C2023408010), and College Students &#x2018; Innovation and Entrepreneur ship Training Project (no. 202210879043; 202310879114; 202310879115).</p>
</sec>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2024.1396183/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2024.1396183/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="Table_2.xlsx" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abdi</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Williams</surname> <given-names>L. J.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Principal component analysis</article-title>. <source>WIREs Comput. Stat</source> <volume>2</volume>, <fpage>433</fpage>&#x2013;<lpage>459</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/wics.101</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Atzberger</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Darvishzadeh</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Immitzer</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Schlerf</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Skidmore</surname> <given-names>A.</given-names>
</name>
<name>
<surname>le Maire</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Comparative analysis of different retrieval methods for mapping grassland leaf area index using airborne imaging spectroscopy</article-title>. <source>Int. J. Appl. Earth Observation Geoinformation</source> <volume>43</volume>, <fpage>19</fpage>&#x2013;<lpage>31</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jag.2015.01.009</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bansod</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Singh</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Thakur</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Singhal</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>A comparision between satellite based and drone based remote sensing technology to achieve sustainable development: a review</article-title>. <source>J. Agric. Environ. Int. Dev. (JAEID)</source> <volume>111</volume>, <fpage>383</fpage>&#x2013;<lpage>407</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.12895/jaeid.20172.690</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Becker</surname> <given-names>B. L.</given-names>
</name>
<name>
<surname>Lusch</surname> <given-names>D. P.</given-names>
</name>
<name>
<surname>Qi</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Identifying optimal spectral bands from in <italic>situ</italic> measurements of Great Lakes coastal wetlands using second-derivative analysis</article-title>. <source>Remote Sens. Environ.</source> <volume>97</volume>, <fpage>238</fpage>&#x2013;<lpage>248</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2005.04.020</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cao</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2021</year>a). <article-title>Hyperspectral inversion of nitrogen content in maize leaves based on different dimensionality reduction algorithms</article-title>. <source>Comput. Electron. Agric.</source> <volume>190</volume>, <elocation-id>106461</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2021.106461</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cao</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Tao</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>b). <article-title>Integrating Multi-Source Data for Rice Yield Prediction across China using Machine Learning and Deep Learning Approaches</article-title>. <source>Agric. For. Meteorol.</source> <volume>297</volume>, <elocation-id>108275</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.agrformet.2020.108275</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chang</surname> <given-names>K.-W.</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Lo</surname> <given-names>J.-C.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Predicting rice yield using canopy reflectance measured at booting stage</article-title>. <source>Agron. J.</source> <volume>97</volume>, <fpage>872</fpage>&#x2013;<lpage>878</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2134/agronj2004.0162</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Meng</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Su</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Decision variants for the automatic determination of optimal feature subset in RF-RFE</article-title>. <source>Genes</source> <volume>9</volume>, <elocation-id>301</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/genes9060301</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>L.</given-names>
</name>
<name>
<surname>He</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Rapid estimation of leaf nitrogen content in apple-trees based on canopy hyperspectral reflectance using multivariate methods</article-title>. <source>Infrared Phys. Technol.</source> <volume>111</volume>, <elocation-id>103542</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.infrared.2020.103542</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cheng</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Song</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Yao</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Spectroscopic estimation of biomass in canopy components of paddy rice using dry matter and chlorophyll indices</article-title>. <source>Remote Sens.</source> <volume>9</volume>, <elocation-id>319</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs9040319</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cherkassky</surname> <given-names>V.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>The nature of statistical learning theory~</article-title>. <source>IEEE Trans. Neural Netw.</source> <volume>8</volume>, <fpage>1564</fpage>&#x2013;<lpage>1564</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/TNN.72</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Clevers</surname> <given-names>J. G. P. W.</given-names>
</name>
<name>
<surname>de Jong</surname> <given-names>S. M.</given-names>
</name>
<name>
<surname>Epema</surname> <given-names>G. F.</given-names>
</name>
<name>
<surname>van der Meer</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Bakker</surname> <given-names>W. H.</given-names>
</name>
<name>
<surname>Skidmore</surname> <given-names>A. K.</given-names>
</name>
<etal/>
</person-group>. (<year>2001</year>). <article-title>MERIS and the red-edge position</article-title>. <source>Int. J. Appl. Earth Observation Geoinformation</source> <volume>3</volume>, <fpage>313</fpage>&#x2013;<lpage>320</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0303-2434(01)85038-8</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Datt</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>Remote Sensing of Chlorophyll a, Chlorophyll b, Chlorophyll a+b, and Total Carotenoid Content in Eucalyptus Leaves</article-title>. <source>Remote Sens. Environ.</source> <volume>66</volume>, <fpage>111</fpage>&#x2013;<lpage>121</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0034-4257(98)00046-7</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Degenhardt</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Seifert</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Szymczak</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Evaluation of variable selection methods for random forests and omics data sets</article-title>. <source>Briefings Bioinf.</source> <volume>20</volume>, <fpage>492</fpage>&#x2013;<lpage>503</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bib/bbx124</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Demetriades-Shah</surname> <given-names>T. H.</given-names>
</name>
<name>
<surname>Steven</surname> <given-names>M. D.</given-names>
</name>
<name>
<surname>Clark</surname> <given-names>J. A.</given-names>
</name>
</person-group> (<year>1990</year>). <article-title>High resolution derivative spectra in remote sensing</article-title>. <source>Remote Sens. Environ.</source> <volume>33</volume>, <fpage>55</fpage>&#x2013;<lpage>64</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0034-4257(90)90055-Q</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Devia</surname> <given-names>C. A.</given-names>
</name>
<name>
<surname>Rojas</surname> <given-names>J. P.</given-names>
</name>
<name>
<surname>Petro</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Martinez</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Mondragon</surname> <given-names>I. F.</given-names>
</name>
<name>
<surname>Patino</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>High-throughput biomass estimation in rice crops using UAV multispectral imagery</article-title>. <source>J. Intell. Robot Syst.</source> <volume>96</volume>, <fpage>573</fpage>&#x2013;<lpage>589</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10846-019-01001-5</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fang</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Xue</surname> <given-names>B.-L.</given-names>
</name>
<name>
<surname>Yinglan</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Controls of carbon flux in a semi-arid grassland ecosystem experiencing wetland loss: Vegetation patterns and environmental variables</article-title>. <source>Agric. For. Meteorol.</source> <volume>259</volume>, <fpage>196</fpage>&#x2013;<lpage>210</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.agrformet.2018.05.002</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Filella</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Penuelas</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>The red edge position and shape as indicators of plant chlorophyll content, biomass and hydric status</article-title>. <source>Int. J. Remote Sens.</source> <volume>15</volume>, <fpage>1459</fpage>&#x2013;<lpage>1470</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/01431169408954177</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Forrester</surname> <given-names>J. B.</given-names>
</name>
<name>
<surname>Kalivas</surname> <given-names>J. H.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Ridge regression optimization using a harmonious approach</article-title>. <source>J. Chemometrics</source> <volume>18</volume>, <fpage>372</fpage>&#x2013;<lpage>384</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/cem.883</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Progress of hyperspectral data processing and modelling for cereal crop nitrogen monitoring</article-title>. <source>Comput. Electron. Agric.</source> <volume>172</volume>, <elocation-id>105321</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2020.105321</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Galv&#xe3;o</surname> <given-names>L. S.</given-names>
</name>
<name>
<surname>Formaggio</surname> <given-names>A. R.</given-names>
</name>
<name>
<surname>Tisot</surname> <given-names>D. A.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Discrimination of sugarcane varieties in Southeastern Brazil with EO-1 Hyperion data</article-title>. <source>Remote Sens. Environ.</source> <volume>94</volume>, <fpage>523</fpage>&#x2013;<lpage>534</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2004.11.012</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gao</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Meng</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Ge</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Yin</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Modeling alpine grassland forage phosphorus based on hyperspectral remote sensing and a multi-factor machine learning algorithm in the east of Tibetan Plateau, China</article-title>. <source>ISPRS J. Photogrammetry Remote Sens.</source> <volume>147</volume>, <fpage>104</fpage>&#x2013;<lpage>117</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.isprsjprs.2018.11.015</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Geladi</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Kowalski</surname> <given-names>B. R.</given-names>
</name>
</person-group> (<year>1986</year>). <article-title>Partial least-squares regression: a tutorial</article-title>. <source>Analytica Chimica Acta</source> <volume>185</volume>, <fpage>1</fpage>&#x2013;<lpage>17</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0003-2670(86)80028-9</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gerretzen</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Szyma&#x144;ska</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Jansen</surname> <given-names>J. J.</given-names>
</name>
<name>
<surname>Bart</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Van Manen</surname> <given-names>H.-J.</given-names>
</name>
<name>
<surname>Van Den Heuvel</surname> <given-names>E. R.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Simple and effective way for data preprocessing selection based on design of experiments</article-title>. <source>Anal. Chem.</source> <volume>87</volume>, <fpage>12096</fpage>&#x2013;<lpage>12103</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1021/acs.analchem.5b02832</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gitelson</surname> <given-names>A. A.</given-names>
</name>
<name>
<surname>Merzlyak</surname> <given-names>M. N.</given-names>
</name>
<name>
<surname>Lichtenthaler</surname> <given-names>H. K.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>Detection of red edge position and chlorophyll content by reflectance measurements near 700 nm</article-title>. <source>J.&#xa0;Plant Physiol.</source> <volume>148</volume>, <fpage>501</fpage>&#x2013;<lpage>508</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0176-1617(96)80285-9</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gnyp</surname> <given-names>M. L.</given-names>
</name>
<name>
<surname>Miao</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Ustin</surname> <given-names>S. L.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Yao</surname> <given-names>Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2014</year>). <article-title>Hyperspectral canopy sensing of paddy rice aboveground biomass at different growth stages</article-title>. <source>Field Crops Res.</source> <volume>155</volume>, <fpage>42</fpage>&#x2013;<lpage>55</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.fcr.2013.09.023</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guyon</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Weston</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Barnhill</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Vapnik</surname> <given-names>V.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Gene selection for cancer classification using support vector machines</article-title>. <source>Mach. Learn.</source> <volume>46</volume>, <fpage>389</fpage>&#x2013;<lpage>422</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1023/A:1012487302797</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hansen</surname> <given-names>P. M.</given-names>
</name>
<name>
<surname>Schjoerring</surname> <given-names>J. K.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Reflectance measurement of canopy biomass and nitrogen status in wheat crops using normalized difference vegetation indices and partial least squares regression</article-title>. <source>Remote Sens. Environ.</source> <volume>86</volume>, <fpage>542</fpage>&#x2013;<lpage>553</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0034-4257(03)00131-7</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>He</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Su</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Yao</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>T.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Estimating leaf area index with a new vegetation index considering the influence of rice panicles</article-title>. <source>Remote Sens.</source> <volume>11</volume>, <elocation-id>1809</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs11151809</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Helland</surname> <given-names>I. S.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Some theoretical aspects of partial least squares regression</article-title>. <source>Chemometrics Intelligent Lab. Syst.</source> <volume>58</volume>, <fpage>97</fpage>&#x2013;<lpage>107</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0169-7439(01)00154-X</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Horler</surname> <given-names>D. N. H.</given-names>
</name>
<name>
<surname>Dockray</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Barber</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>1983</year>). <article-title>The red edge of plant leaf reflectance</article-title>. <source>Int. J. Remote Sens.</source> <volume>4</volume>, <fpage>273</fpage>&#x2013;<lpage>288</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/01431168308948546</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ivanda</surname> <given-names>A.</given-names>
</name>
<name>
<surname>&#x160;eri&#x107;</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Bugari&#x107;</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Braovi&#x107;</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Mapping chlorophyll-a concentrations in the ka&#x161;tela bay and bra&#x10d; Channel using ridge regression and sentinel-2 satellite images</article-title>. <source>Electronics</source> <volume>10</volume>, <elocation-id>3004</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/electronics10233004</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ji</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Gu</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Xi</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Hong</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Huo</surname> <given-names>Z.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Quantitative monitoring of leaf area index in rice based on hyperspectral feature bands and ridge regression algorithm</article-title>. <source>Remote Sens.</source> <volume>14</volume>, <elocation-id>2777</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs14122777</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jia</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Su</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Quantitative analysis and hyperspectral remote sensing inversion of rice canopy spad in A cold region</article-title>. <source>Eng. Agr&#xed;c.</source> <volume>42</volume>, <elocation-id>e20220030</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1590/1809-4430-eng.agric.v42n4e20220030/2022</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kanke</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Tuba&#xf1;a</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Dalen</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Harrell</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Evaluation of red and red-edge reflectance-based vegetation indices for rice biomass and grain yield prediction models in paddy fields</article-title>. <source>Precis. Agric.</source> <volume>17</volume>, <fpage>507</fpage>&#x2013;<lpage>530</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11119-016-9433-1</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kawamura</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Ikeura</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Phongchanmaixay</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Khanthavong</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Canopy Hyperspectral Sensing of Paddy Fields at the Booting Stage and PLS Regression can Assess Grain Yield</article-title>. <source>Remote Sens.</source> <volume>10</volume>, <elocation-id>1249</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs10081249</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kawano</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Fujisawa</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Takada</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Shiroishi</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Sparse principal component regression for generalized linear models</article-title>. <source>Comput. Stat Data Anal.</source> <volume>124</volume>, <fpage>180</fpage>&#x2013;<lpage>196</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.csda.2018.03.008</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kokaly</surname> <given-names>R. F.</given-names>
</name>
<name>
<surname>Clark</surname> <given-names>R. N.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>Spectroscopic determination of leaf biochemistry using band-depth analysis of absorption features and stepwise multiple linear regression</article-title>. <source>Remote Sens. Environ.</source> <volume>67</volume>, <fpage>267</fpage>&#x2013;<lpage>287</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0034-4257(98)00084-4</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Krishnan</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Ramakrishnan</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Reddy</surname> <given-names>K. R.</given-names>
</name>
<name>
<surname>Reddy</surname> <given-names>V. R.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Chapter three - high-temperature effects on rice growth, yield, and grain quality</article-title>. <source>Adv. Agron.</source> <volume>111</volume>, <fpage>87</fpage>&#x2013;<lpage>206</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/B978-0-12-387689-8.00004-7</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kursa</surname> <given-names>M. B.</given-names>
</name>
<name>
<surname>Jankowski</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Rudnicki</surname> <given-names>W. R.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Boruta &#x2013; A system for feature selection</article-title>. <source>Fundamenta Informaticae</source> <volume>101</volume>, <fpage>271</fpage>&#x2013;<lpage>285</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3233/FI-2010-288</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kursa</surname> <given-names>M. B.</given-names>
</name>
<name>
<surname>Rudnicki</surname> <given-names>W. R.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Feature selection with the boruta package</article-title>. <source>J. Stat. Software</source> <volume>36</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.18637/jss.v036.i11</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Duan</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Sui</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>UAV-based hyperspectral and ensemble machine learning for predicting yield in winter wheat</article-title>. <source>Agronomy</source> <volume>12</volume>, <elocation-id>202</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/agronomy12010202</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Adaptive fractional differential approach and its application to medical image enhancement</article-title>. <source>Comput. Electrical Eng.</source> <volume>45</volume>, <fpage>324</fpage>&#x2013;<lpage>335</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compeleceng.2015.02.013</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Di</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>L.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Estimation of leaf nitrogen content in wheat using new hyperspectral indices and a random forest regression algorithm</article-title>. <source>Remote Sens.</source> <volume>10</volume>, <elocation-id>1940</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs10121940</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Ren</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Yue</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Yin</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Eucalyptus plantation area extraction based on SLPSO-RFE feature selection and multi-temporal sentinel-1/2 data</article-title>. <source>Forests</source> <volume>14</volume>, <elocation-id>1864</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/f14091864</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>G.-S.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>H.-S.</given-names>
</name>
<name>
<surname>Pan</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J.-H.</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Vis-NIR spectroscopic pattern recognition combined with SG smoothing applied to breed screening of transgenic sugarcane</article-title>. <source>Guang Pu Xue Yu Guang Pu Fen Xi</source> <volume>34</volume>, <fpage>2701</fpage>&#x2013;<lpage>2706</lpage>.</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lucas</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Van De Kerchove</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Otero</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Lagomasino</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Fatoyinbo</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Omar</surname> <given-names>H.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Structural characterisation of mangrove forests achieved through combining multiple sources of remote sensing data</article-title>. <source>Remote Sens. Environ.</source> <volume>237</volume>, <elocation-id>111543</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2019.111543</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mishra</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Biancolillo</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Roger</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Marini</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Rutledge</surname> <given-names>D. N.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>New data preprocessing trends based on ensemble of multiple preprocessing techniques</article-title>. <source>TrAC Trends Analytical Chem.</source> <volume>132</volume>, <elocation-id>116045</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.trac.2020.116045</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moore</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>1981</year>). <article-title>Principal component analysis in linear systems: Controllability, observability, and model reduction</article-title>. <source>IEEE Trans. Automatic Control</source> <volume>26</volume>, <fpage>17</fpage>&#x2013;<lpage>32</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/TAC.1981.1102568</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pan</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>H.-C.</given-names>
</name>
<name>
<surname>Deng</surname> <given-names>Y.-J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>X.-D.</given-names>
</name>
<name>
<surname>Du</surname> <given-names>Q.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Hyperspectral dimensionality reduction by tensor sparse and low-rank graph-based discriminant analysis</article-title>. <source>Remote Sens.</source> <volume>9</volume>, <elocation-id>452</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs9050452</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Paul</surname> <given-names>J.</given-names>
</name>
<name>
<surname>D'Ambrosio</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Dupont</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Kernel methods for heterogeneous feature selection</article-title>. <source>Neurocomputing</source> <volume>169</volume>, <fpage>187</fpage>&#x2013;<lpage>195</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.neucom.2014.12.098</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Poona</surname> <given-names>N. K.</given-names>
</name>
<name>
<surname>Niekerk</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Nadel</surname> <given-names>R. L.</given-names>
</name>
<name>
<surname>Ismail</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Random forest (RF) wrappers for waveband selection and classification of hyperspectral data</article-title>. <source>Appl. Spectrosc. AS</source> <volume>70</volume>, <fpage>322</fpage>&#x2013;<lpage>333</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1177/0003702815620545</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Prasad</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Deo</surname> <given-names>R. C.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Maraseni</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Weekly soil moisture forecasting with multivariate sequential, ensemble empirical mode decomposition and Boruta-random forest hybridizer algorithm approach</article-title>. <source>CATENA</source> <volume>177</volume>, <fpage>149</fpage>&#x2013;<lpage>166</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.catena.2019.02.012</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Raja</surname> <given-names>S. P.</given-names>
</name>
<name>
<surname>Sawicka</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Stamenkovic</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Mariammal</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Crop prediction based on characteristics of the agricultural environment using various feature selection techniques and classifiers</article-title>. <source>IEEE Access</source> <volume>10</volume>, <fpage>23625</fpage>&#x2013;<lpage>23641</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/ACCESS.2022.3154350</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ren</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>F.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Using negative soil adjustment factor in soil-adjusted vegetation index (SAVI) for aboveground living biomass estimation in arid grasslands</article-title>. <source>Remote Sens. Environ.</source> <volume>209</volume>, <fpage>439</fpage>&#x2013;<lpage>445</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2018.02.068</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Savitzky</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Golay</surname> <given-names>M. J. E.</given-names>
</name>
</person-group> (<year>1964</year>). <article-title>Smoothing and differentiation of data by simplified least squares procedures</article-title>. <source>Anal. Chem.</source> <volume>36</volume>, <fpage>1627</fpage>&#x2013;<lpage>1639</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1021/ac60214a047</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schafer</surname> <given-names>R. W.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>What is a savitzky-golay filter? [Lecture notes]</article-title>. <source>IEEE Signal Process. Magazine</source> <volume>28</volume>, <fpage>111</fpage>&#x2013;<lpage>117</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/MSP.2011.941097</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schino</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Borfecchia</surname> <given-names>F.</given-names>
</name>
<name>
<surname>De Cecco</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Dibari</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Iannetta</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Martini</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2003</year>). <article-title>Satellite estimate of grass biomass in a mountainous range in central Italy</article-title>. <source>Agroforestry Syst.</source> <volume>59</volume>, <fpage>157</fpage>&#x2013;<lpage>162</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1023/A:1026308928874</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shafaei</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Kisi</surname> <given-names>O.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Predicting river daily flow using wavelet-artificial neural networks based on regression analyses in comparison with artificial neural networks and support vector machine models</article-title>. <source>Neural Comput. Applic</source> <volume>28</volume>, <fpage>15</fpage>&#x2013;<lpage>28</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00521-016-2293-9</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shen</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Yan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Winter wheat SPAD value inversion based on multiple pretreatment methods</article-title>. <source>Remote Sens.</source> <volume>14</volume>, <elocation-id>4660</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs14184660</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shi</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Yao</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Pan</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Visible and near-infrared spectroscopy with multi-parameters optimization of savitzky-golay smoothing applied to rapid analysis of soil cr content of pearl river delta</article-title>. <source>J. Geosci. Environ. Prot.</source> <volume>09</volume>, <fpage>75</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.4236/gep.2021.93006</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smith</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Campbell</surname> <given-names>F.</given-names>
</name>
</person-group> (<year>1980</year>). <article-title>A critique of some ridge regression methods</article-title>. <source>J.&#xa0;Am. Stat. Assoc.</source> <volume>75</volume>, <fpage>74</fpage>&#x2013;<lpage>81</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/01621459.1980.10477428</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Spiertz</surname> <given-names>J. H. J.</given-names>
</name>
<name>
<surname>Ewert</surname> <given-names>F.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Crop production and resource use to meet the growing demand for food, feed and fuel: opportunities and constraints</article-title>. <source>NJAS: Wageningen J. Life Sci.</source> <volume>56</volume>, <fpage>281</fpage>&#x2013;<lpage>300</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S1573-5214(09)80001-8</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Xiao</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Ding</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Potential of multivariate statistical technique based on the effective spectra bands to estimate the plant water content of wheat under different irrigation regimes</article-title>. <source>Front. Plant Sci.</source> <volume>12</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2021.631573</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Suryakala</surname> <given-names>S. V.</given-names>
</name>
<name>
<surname>Prince</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Investigation of goodness of model data fit using PLSR and PCR regression models to determine informative wavelength band in NIR region for non-invasive blood glucose prediction</article-title>. <source>Opt Quant Electron</source> <volume>51</volume>, <fpage>271</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11082-019-1985-7</pub-id>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Suykens</surname> <given-names>J. A. K.</given-names>
</name>
<name>
<surname>Vandewalle</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>Least squares support vector machine classifiers</article-title>. <source>Neural Process. Lett.</source> <volume>9</volume>, <fpage>293</fpage>&#x2013;<lpage>300</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1023/A:1018628609742</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Takai</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Matsuura</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Nishio</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Ohsumi</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Shiraiwa</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Horie</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Rice yield potential is closely related to crop growth rate during late reproductive period</article-title>. <source>Field Crops Res.</source> <volume>96</volume>, <fpage>328</fpage>&#x2013;<lpage>335</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.fcr.2005.08.001</pub-id>
</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tong</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Duan</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Singh</surname> <given-names>V. P.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Estimation of grassland aboveground biomass combining optimal derivative and raw reflectance vegetation indices at peak productive growth stage</article-title>. <source>Geocarto Int.</source> <volume>38</volume>, <elocation-id>2186497</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/10106049.2023.2186497</pub-id>
</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tunca</surname> <given-names>E.</given-names>
</name>
<name>
<surname>K&#xf6;ksal</surname> <given-names>E. S.</given-names>
</name>
<name>
<surname>&#xd6;zt&#xfc;rk</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Akay</surname> <given-names>H.</given-names>
</name>
<name>
<surname>&#xc7;etin Taner</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Accurate estimation of sorghum crop water content under different water stress levels using machine learning and hyperspectral data</article-title>. <source>Environ. Monit Assess.</source> <volume>195</volume>, <fpage>877</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10661-023-11536-8</pub-id>
</citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Study on hyperspectral remote sensing estimation models about aboveground fresh biomass of rice</article-title>. <source>Remote Sens. Modeling Ecosyst. Sustainability (SPIE)</source>, <fpage>336</fpage>&#x2013;<lpage>345</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1117/12.557403</pub-id>
</citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Dong</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Estimation of biomass in wheat using random forest regression algorithm and remote sensing data</article-title>. <source>Crop J.</source> <volume>4</volume>, <fpage>212</fpage>&#x2013;<lpage>219</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cj.2016.01.008</pub-id>
</citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Yao</surname> <given-names>X.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Dynamic estimation of rice aboveground biomass based on spectral and spatial information extracted from hyperspectral remote sensing images at different combinations of growth stages</article-title>. <source>ISPRS J. Photogrammetry Remote Sens.</source> <volume>202</volume>, <fpage>169</fpage>&#x2013;<lpage>183</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.isprsjprs.2023.05.021</pub-id>
</citation>
</ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Yao</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Integrating the textural and spectral information of UAV hyperspectral images for the improved estimation of rice aboveground biomass</article-title>. <source>Remote Sens.</source> <volume>14</volume>, <elocation-id>2534</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs14112534</pub-id>
</citation>
</ref>
<ref id="B74">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>C.-M.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>R.-K.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Modeling rice growth with hyperspectral reflectance data</article-title>. <source>Crop Sci.</source> <volume>44</volume>, <fpage>1283</fpage>&#x2013;<lpage>1290</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2135/cropsci2004.1283</pub-id>
</citation>
</ref>
<ref id="B75">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Modeling grassland above-ground biomass based on artificial neural network and remote sensing in the Three-River Headwaters Region</article-title>. <source>Remote Sens. Environ.</source> <volume>204</volume>, <fpage>448</fpage>&#x2013;<lpage>455</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2017.10.011</pub-id>
</citation>
</ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2011</year>). <article-title>Estimating biophysical parameters of rice with remote sensing data using support vector machines</article-title>. <source>Sci. China Life Sci.</source> <volume>54</volume>, <fpage>272</fpage>&#x2013;<lpage>281</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11427-011-4135-4</pub-id>
</citation>
</ref>
<ref id="B77">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yan-lin</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Jing-feng</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Ren-chao</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Change law of hyperspectral data in related with chlorophyll and carotenoid in rice at different developmental stages</article-title>. <source>Rice Sci.</source> <volume>11</volume>, <fpage>274&#x2013;282</fpage>.</citation>
</ref>
<ref id="B78">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yoosefzadeh-Najafabadi</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Earl</surname> <given-names>H. J.</given-names>
</name>
<name>
<surname>Tulpan</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Sulik</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Eskandari</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Application of machine learning algorithms in plant breeding: predicting yield from hyperspectral reflectance in soybean</article-title>. <source>Front. Plant Sci.</source> <volume>11</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2020.624273</pub-id>
</citation>
</ref>
<ref id="B79">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Bai</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Inversion of rice leaf biomass based on PROSAIL model optimization</article-title>. <source>J. Huazhong Agric. Univ. (Natural Sci. Edition) (English Edition)</source> <volume>42</volume>, <fpage>187</fpage>&#x2013;<lpage>194</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.13300/j.cnki.hnlkxb.2023.03.022</pub-id>
</citation>
</ref>
<ref id="B80">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Du</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Xing</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>A study of nitrogen deficiency inversion in rice leaves based on the hyperspectral reflectance differential</article-title>. <source>Front. Plant Sci.</source> <volume>11</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2020.573272</pub-id>
</citation>
</ref>
<ref id="B81">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yue</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Estimate of winter-wheat above-ground biomass based on UAV ultrahigh-ground-resolution image textures and vegetation indices</article-title>. <source>ISPRS J. Photogrammetry Remote Sens.</source> <volume>150</volume>, <fpage>226</fpage>&#x2013;<lpage>244</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.isprsjprs.2019.02.022</pub-id>
</citation>
</ref>
<ref id="B82">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Ge</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>Q.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Predicting rice grain yield based on dynamic changes in vegetation indexes during early to mid-growth stages</article-title>. <source>Remote Sens.</source> <volume>11</volume>, <elocation-id>387</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs11040387</pub-id>
</citation>
</ref>
<ref id="B83">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Hyperspectral modeling of soil organic matter based on characteristic wavelength in east China</article-title>. <source>Sustainability</source> <volume>14</volume>, <elocation-id>8455</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/su14148455</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>