<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2025.1507442</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Deep learning and hyperspectral features for seedling stage identification of barnyard grass in paddy field</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Tan</surname>
<given-names>Siqiao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Xie</surname>
<given-names>Qiang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhu</surname>
<given-names>Wenshuai</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Deng</surname>
<given-names>Yangjun</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhu</surname>
<given-names>Lei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yu</surname>
<given-names>Xiaoqiao</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yuan</surname>
<given-names>Zheming</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1154394"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Chen</surname>
<given-names>Yuan</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/781309"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>College of Information and Intelligent Science and Technology, Hunan Agricultural University</institution>, <addr-line>Changsha, Hunan</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>College of Plant Protection, Hunan Agricultural University</institution>, <addr-line>Changsha, Hunan</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Hunan Engineering and Technology Research Centre for Agricultural Big Data Analysis and Decision-Making, Hunan Agricultural University</institution>, <addr-line>Changsha, Hunan</addr-line>, <country>China</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Ecological Simulation Breeding and Phenotype ldentification Platform, Yuelu Mountain Laboratory of Hunan Province</institution>, <addr-line>Changsha, Hunan</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Yunchao Tang, Dongguan University of Technology, China</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Omid Memarian Sorkhabi, Aberystwyth University, United Kingdom</p>
<p>Wioleta Wasilewska-D&#x119;bowska, University of Warsaw, Poland</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Yuan Chen, <email xlink:href="mailto:chenyuan0510@126.com">chenyuan0510@126.com</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>07</day>
<month>02</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2025</year>
</pub-date>
<volume>16</volume>
<elocation-id>1507442</elocation-id>
<history>
<date date-type="received">
<day>07</day>
<month>10</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>20</day>
<month>01</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Tan, Xie, Zhu, Deng, Zhu, Yu, Yuan and Chen</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Tan, Xie, Zhu, Deng, Zhu, Yu, Yuan and Chen</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Barnyard grass, a pernicious weed thriving in rice fields, poses a significant challenge to agricultural productivity. Detection of barnyard grass before the four-leaf stage is critical for effective control measures. However, due to their striking visual similarity, separating them from rice seedlings at early growth stages is daunting using traditional visible light imaging models. To explore the feasibility of hyperspectral identification of barnyard grass and rice in the seedling stage, we have pioneered the DeepBGS hyperspectral feature parsing framework. This approach harnesses the power of deep convolutional networks to automate the extraction of pertinent information. Initially, a sliding window-based technique is employed to transform the one-dimensional spectral band sequence into a more interpretable two-dimensional matrix. Subsequently, a deep convolutional feature extraction module, ensembled with a bilayer LSTM module, is deployed to capture both global and local correlations inherent within hyperspectral bands. The efficacy of DeepBGS was underscored by its unparalleled performance in discriminating barnyard grass from rice during the critical 2-3 leaf stage, achieving a 98.18% accuracy rate. Notably, this surpasses the capabilities of other models that rely on amalgamations of machine learning algorithms and feature dimensionality reduction methods. By seamlessly integrating deep convolutional networks, DeepBGS independently extracts salient features, indicating that hyperspectral imaging technology can be used to effectively identify barnyard grass in the early stages, and pave the way for the development of advanced early detection systems.</p>
</abstract>
<kwd-group>
<kwd>hyperspectral features</kwd>
<kwd>rice</kwd>
<kwd>barnyard grass</kwd>
<kwd>convolutional neural network</kwd>
<kwd>DeepBGS</kwd>
<kwd>sliding window</kwd>
</kwd-group>
<counts>
<fig-count count="7"/>
<table-count count="3"/>
<equation-count count="7"/>
<ref-count count="28"/>
<page-count count="11"/>
<word-count count="5220"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Technical Advances in Plant Science</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Barnyard grass, a pernicious weed with global ramifications, presents a formidable threat to agricultural ecosystems. Competing relentlessly with rice for essential resources such as light, water, nutrients, and space, it undermines the productivity of rice crops. Moreover, its presence fosters a conducive environment for pests and diseases, exacerbating the risk of diminished crop quality and yield. Early intervention is paramount in mitigating the spread of barnyard grass, ideally before it attains the 3-4 leaf stage, as its resistance to herbicides escalates with maturity. The eradication of mature barnyard grass poses considerable challenges, often necessitating excessive chemical interventions. Such practices not only foster herbicide resistance but also precipitate environmental degradation, jeopardizing the health of rice crops.</p>
<p>Precise field monitoring stands as the linchpin for timely barnyard grass control. However, conventional methods of manual identification are marred by their labor-intensive and time-consuming nature, rendering large-scale monitoring of barnyard grass outbreaks impractical. Hence, there arises an urgent need for the development of high-throughput and precise early detection techniques to effectively curb its proliferation, curtail herbicide usage, and enhance overall operational efficiency. In contrast to the conventional dryland weed identification methods, the recognition of weeds in rice fields predominantly relies on unmanned aerial vehicle (UAV) remote sensing image segmentation techniques. For instance, <xref ref-type="bibr" rid="B9">Huang et&#xa0;al. (2018)</xref> proposed a weed mapping and prescription map generation model, leveraging an enhanced fully convolutional network -4 (FCN-4) architecture for identifying Cyperus iric and Leptochloa chinensis in rice fields. Their approach yielded impressive overall accuracy and mean intersection over union (mean IU) scores of 0.9196 and 0.8473, respectively. Moreover, <xref ref-type="bibr" rid="B17">Ma et&#xa0;al. (2019)</xref> introduced a semantic segmentation method based on a fully convolutional network with the segmentation network (SegNet) model, achieving a mean average precision (MAP) of 0.927 by directly extracting features from initial RGB images and recognizing pixels corresponding to rice, background, and Sagittaria trifolia in paddy field images. Additionally, <xref ref-type="bibr" rid="B12">Lan et&#xa0;al. (2021)</xref> proposed improved feature fusion branch-bilateral segmentation network V2 (FFB-BiSeNetV2) models for real-time identification of rice weeds by UAV low-altitude remote sensing, achieving a pixel accuracy of 93.09% and a mean Intersection over union ratio of 80.28%. Furthermore, <xref ref-type="bibr" rid="B11">Kamath et&#xa0;al. (2020)</xref> investigated multiple classifier systems built using support vector machines (SVM) and random forest (RF) classifiers for classifying paddy crops and weeds from digital images, achieving an accuracy of 91.36%. <xref ref-type="bibr" rid="B21">Peng et&#xa0;al. (2022)</xref> devised the weed detection model based on RetinaNet, specifically addressing the challenge of overlapping between rice and various weed species. Their model achieved exceptional results with a high MAP of 94.1% on a dataset containing rice and eight distinct weed categories for object detection. Indeed, discerning barnyard grass from rice seedlings during their initial growth phases presents a formidable challenge, primarily owing to their remarkably similar visual appearances (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>). This visual conundrum poses a significant obstacle for traditional visible-light imaging models, which often struggle to differentiate between the two with precision. Consequently, as of now, there exists no viable method leveraging visible light imaging models for accurately identifying barnyard grass seedlings.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Comparison of seedling morphology between rice and barnyard grass. Plants designated as 1, 3, 5, and 7 represent rice, while those marked as 2, 4, 6, and 8 correspond to barnyard grass.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1507442-g001.tif"/>
</fig>
<p>Hyperspectral (HS) emerges as a potent tool for extracting both structural and physiological insights from plants, effectively circumventing the limitations of RGB imaging in distinguishing species with similar phenotypes (<xref ref-type="bibr" rid="B18">Mishra et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B1">Amigo and Grassi, 2019</xref>; <xref ref-type="bibr" rid="B15">Liu et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B24">Sari&#x107; et&#xa0;al., 2022</xref>). <xref ref-type="bibr" rid="B14">Li et&#xa0;al. (2021)</xref> demonstrated the efficacy of hyperspectral imaging data coupled with machine learning techniques in discriminating between two broadleaf weed species, Ranunculus acris (Giant buttercup) and Cirsium arvense (Californian thistle), achieving an impressive accuracy of 89.1%. Similarly, <xref ref-type="bibr" rid="B6">Diao et&#xa0;al. (2022)</xref> proposed a practical technical approach for rapidly training and identifying hyperspectral images of corn seedlings and weeds using a lightweight three-dimensional convolutional neural network, achieving an outstanding average recognition accuracy of 98.58%. It&#x2019;s noteworthy that while <xref ref-type="bibr" rid="B28">Zhang et&#xa0;al. (2019)</xref> developed a SVM-based classification model leveraging six crucial spectral features selected by successive projections algorithm (SPA), yielding a commendable recognition rate of 97% for barnyard grass, weedy rice, and rice. However, their focus was primarily on the tillering stage rather than the seedling stage.</p>
<p>A plethora of wavebands in HS data offers rich information but also presents analytical challenges (<xref ref-type="bibr" rid="B24">Sari&#x107; et&#xa0;al., 2022</xref>). Crafting algorithms to dissect hyperspectral image data is pivotal in maximizing the potential of hyperspectral technology. In this study, we propose an automatic framework, deep learning-based identification model for barnyard grass in seeding stage (DeepBGS), for hyperspectral feature extraction based on convolutional neural networks (CNNs), aimed at precisely recognizing barnyard grass and rice at the seedling stage. Initially, preprocessed hyperspectral band sequences undergo segmentation into multiple overlapping subsequences, which are then transformed into a sequence matrix. Subsequently, a convolutional module featuring an attention mechanism is constructed to automatically extract correlation information between local and global bands. Independent tests unequivocally the superiority of DeepBGS over the reference model, achieving 98.18% accuracy in distinguishing barnyard grass and rice at the 2-3 leaf stage.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Data acquisition</title>
<p>The study employed rice and barnyard grass specimens cultivated indoors under meticulously controlled conditions. These conditions ensured a temperature range of 25-28&#xb0;C, humidity levels ranging between 40-70%, and a regulated 12-hour exposure to light. Only specimens of impeccable quality, devoid of any pest infestations or diseases, were chosen for leaf hyperspectral data collection. Spectral reflectance measurements of the leaves were conducted using a ground truth spectrometer (Field Spec Pro FR2500 spectrometer). This device boasted a wavelength range spanning from 350 to 2500 nm, with a sampling interval of 1.4 nm and a spectral resolution of 3 nm within 350-1000 nm range, and a sampling interval of 2.0 nm with a spectral resolution of 10 nm within 1000-2500 nm range. Leaf blade measurements were meticulously performed using leaf clamps within the canopy position of plants. Prior to each measurement, adjustments to the spectrometer parameters were meticulously carried out using the RS3 software, and spectral calibration against a whiteboard was conducted. To ensure robustness and accuracy, five consecutive samples were collected for each measurement, and the average value was calculated. A total of 660 samples were collected across three batches, comprising 313 rice and 347 barnyard grass specimens. The training set included 495 samples, incorporating data from the first two batches, with 243 rice and 252 barnyard grass samples. The test set, derived from the third batch, consisted of 70 rice and 95 barnyard grass specimens.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Data preprocessing</title>
<p>The dataset amassed in this investigation comprises spectral band reflectance data, with each sample encapsulating 2151 band reflectance values (<xref ref-type="fig" rid="f3">
<bold>Figure 3A</bold>
</xref>). To fortify the reliability of the spectral data for subsequent analysis, four preprocessing methodologies were employed: standard normal variate transformation (SNV) (<xref ref-type="bibr" rid="B4">Bi et&#xa0;al., 2016</xref>), moving average (MA) (<xref ref-type="bibr" rid="B26">Timothy and Anuradha, 2023</xref>), savitzky golay smoothing (SG) (<xref ref-type="bibr" rid="B16">Luo et&#xa0;al., 2005</xref>), and mean centering (MC) (<xref ref-type="bibr" rid="B10">Ijomah, 2019</xref>). These methods served to mitigate data noise and rectify wavelength shifts, thus enhancing the overall quality and integrity of the spectral data. SNV, for instance, functions to rectify scale differences such as tilts or spikes, thereby accentuating the dynamic components of the spectral data. MA, on the other hand, operates by smoothing the dataset through point averaging within a window, effectively mitigating noise influence and suppressing periodic noise. SG, renowned for its efficacy in managing spikes and data variations, smooths the signal by attenuating high-frequency noise components. Lastly, MC plays a pivotal role in dataset rectification, eradicating biases stemming from measurement disparities, inherent variations, or substantial value discrepancies. The original spectral reflectance data and preprocessed data are shown in <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Raw spectral reflectance data and preprocessed data. The plots marked as <bold>(A&#x2013;E)</bold> represent the reflectance map of the original spectral data, the SNV preprocessing result, the MA preprocessing result, the SG preprocessing result and the MC preprocessing result.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1507442-g002.tif"/>
</fig>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Subsequence division</title>
<p>Consider a comprehensive breakdown of the preprocessing steps: employing a window length denoted as &#x201c;<italic>w</italic>&#x201d; and a sliding step designated as &#x201c;<italic>s</italic>&#x201d;, the preprocessed hyperspectral data, comprising &#x201c;<italic>m</italic>&#x201d; bands, is meticulously partitioned into (<italic>m</italic>-<italic>w</italic>)/<italic>s</italic>+1 segments. Notably, the final subsequence necessitates an extension in reverse to address any potential length discrepancies. Following this segmentation process, the divided subsequences undergo transformation into a two-dimensional matrix, as depicted in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>. This transformation sets the stage for the extraction of local band correlation features through the utilization of a sophisticated deep convolutional network.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Workflow of DeepBGS. <bold>(A)</bold> illustrates the process of raw data acquisition and preprocessing. <bold>(B)</bold> shows the process of subsequence partitioning. <bold>(C)</bold> depicts the backbone of DeepBGS.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1507442-g003.tif"/>
</fig>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Feature extraction module of DeepBGS</title>
<p>Following the subsequence transformation, each sample is epitomized by an <italic>n</italic>&#xd7;<italic>w</italic> two-dimensional matrix, wherein <italic>n</italic> signifies the number of subsequences and <italic>w</italic> denotes the window length. This matrix stands as the foundational input layer of DeepBGS. Subsequently, the tensor of the <italic>n</italic>&#xd7;<italic>w</italic> matrix traverses through the initial convolutional layer, endowed with rectified linear unit (ReLU) activation and a batch normalization (BN) layer. This layer, housing 16 filters of size 3&#xd7;4 with a stride of 1, amplifies the dimensionality of the initial single-channel data, thus enhancing network expressiveness. The data then progresses through three consecutive feature extraction convolutional modules, each composed of two 3&#xd7;3 convolutional layers, an attention mechanism layer, and a 2&#xd7;2 max pooling layer. Notably, the attention mechanism layer harnesses a 3&#xd7;3 convolutional kernel from the convolutional block attention module (CBAM), bolstering network feature expression and local region expression by integrating both channel and spatial attention. Meanwhile, the maximum pooling layer down samples the feature layer with a step size of 2&#xd7;2. These three convolutional modules contain 32, 64, and 128 filters, respectively. Subsequent to this, the data is downscaled using two convolutional layers, each containing 64 filters, and then merged into a two-layer long-short term memory (LSTM) module with 32 hidden units, and two ReLU-based fully connected layers, featuring 32 and 64 output units, respectively, are incorporated. Regularization is implemented with a dropout probability of 50%, fortifying model generalization. Finally, the output layer employs the <italic>Softmax</italic> function to yield the probability of a sample belonging to rice. The parameters of DeepBGS are optimized using the <italic>Adam Optimizer</italic>, with a learning rate of 5<italic>e</italic>-6, a weight decay parameter of 0.0001, and training epochs and batch sizes set at 150 and 11, respectively. The structure of DeepBGS is shown in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3C</bold>
</xref>.</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Reference models</title>
<p>Four traditional machine learning methods, including decision tree (DT) (<xref ref-type="bibr" rid="B25">Song and Lu, 2015</xref>), random forest (RF) (<xref ref-type="bibr" rid="B5">Breiman, 2001</xref>), SVM (<xref ref-type="bibr" rid="B8">Hearst et&#xa0;al., 1998</xref>) and extreme gradient boosting (XGBoost) (<xref ref-type="bibr" rid="B20">Osman et&#xa0;al., 2021</xref>) classifiers were used alongside four deep learning models&#x2014;DeepBGS-NoLSTM, ResNet, VGG and multi-layer perceptrons (MLP) (<xref ref-type="bibr" rid="B23">Riedmiller, 1994</xref>) &#x2014; to evaluate the performance of DeepBGS model. The DT model was implemented using the <italic>R</italic> package <italic>part 4.1-15</italic>, and the tree was pruned by the optimal <italic>C</italic> parameter value with the least cross-validated error. For the RF model, The <italic>R</italic> package <italic>random Forest 4.6-14</italic> was utilized, with parameters <italic>ntree</italic> and <italic>mtry</italic> set to 500 and <inline-formula>
<mml:math display="inline" id="im1">
<mml:mrow>
<mml:msqrt>
<mml:mrow>
<mml:mtext>No</mml:mtext>
<mml:mo>.</mml:mo>
<mml:mtext>&#xa0;of&#xa0;features</mml:mtext>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:math>
</inline-formula>, respectively. The radial basis function (RBF) based-SVM model was executed using the Library for SVM, available at <ext-link ext-link-type="uri" xlink:href="https://www.csie.ntu.edu.tw/%7Ecjlin/libsvm/index.html">https://www.csie.ntu.edu.tw/%7Ecjlin/libsvm/index.html</ext-link>, A 10-fold cross-validation (10 CV) approach on the training set was used to optimize penalty parameters <italic>C</italic> (<italic>C</italic>&#x2208;[2<sup>-5</sup>, 2<sup>15</sup>]) and <italic>g</italic> parameter <italic>g</italic> (<italic>g</italic>&#x2208;[2<sup>-15</sup>, 2<sup>3</sup>]). XGBoost was implemented based on the Python <italic>sklearn</italic> library with default parameters. The MLP consists of three fully connected layers, where each hidden layer followed by a non-linear transformation employing the <italic>ReLU</italic> activation function. The output parameters of the initial two hidden layers were configured to have 1024 units, while the output layer employed the <italic>softmax</italic> activation function. DeepBGS-NoLSTM was akin to DeepBGS but the LSTM module was replaced by full connectivity layer. ResNet and VGG adopted 18-layer and 10-layer network architectures, respectively, which were implemented using the <italic>PyTorch</italic> framework.</p>
</sec>
<sec id="s2_6">
<label>2.6</label>
<title>Feature engineering</title>
<p>The primary challenge inherent in the analysis of multivariate hyperspectral data analysis lies in the necessity to represent a considerable number of wavebands, which significantly elevates the dimensionality of the data. Therefore, performing hyperspectral data dimension reduction becomes essential to mitigate data redundancy and extract valuable knowledge (<xref ref-type="bibr" rid="B24">Sari&#x107; et&#xa0;al., 2022</xref>). In this study, three types of feature engineering methods were explored, including feature dimensionality reduction, feature selection, and vegetation indices, to enhance the model&#x2019;s prediction performance with high-dimensional bands.</p>
<p>Two techniques, principal component analysis (PCA) (<xref ref-type="bibr" rid="B27">Wold et&#xa0;al., 1987</xref>) and t-distributed stochastic neighbor embedding (t-SNE) (<xref ref-type="bibr" rid="B3">Belkina et&#xa0;al., 2019</xref>), were employed for feature dimensionality reduction. The determination of final dimensions was grounded on the principle of achieving optimal 10-fold cross-validated accuracy within the training set. Implementation of both PCA and t-SNE was facilitated through the Python <italic>sklearn</italic> library. Successive projections algorithm (SPA, <ext-link ext-link-type="uri" xlink:href="https://gitee.com/aBugsLife/SPA">https://gitee.com/aBugsLife/SPA</ext-link>) (<xref ref-type="bibr" rid="B2">Ara&#xfa;jo et&#xa0;al., 2001</xref>) and consecutive adaptive reweighted sampling (<xref ref-type="bibr" rid="B13">Li et&#xa0;al., 2009</xref>) (CARS, <ext-link ext-link-type="uri" xlink:href="https://gitee.com/aBugsLife/CARS">https://gitee.com/aBugsLife/CARS</ext-link>) were utilized for the selection of important hyperspectral spectral bands. SPA employs a method that initially selects variables with the lowest covariance and redundancy while maximizing the projection vector in vector space. Subsequently, the final retained bands are determined based on the optimal principle of 10-fold cross-validated accuracy within the training set. Conversely, CARS utilizes a different approach. It began by retaining points with larger absolute weights of the regression coefficients in the partial least squares regression (PLS) model through adaptive reweighted sampling (ARS). It then iteratively builds PLS models based on the new subset, selecting wavelengths with the smallest root mean square error (RMSE) of cross-validation for the PLS model as the characteristic wavelengths after several calculations.</p>
<p>Ultimately, we diminished the dimensionality of the original data features by extracting spectral vegetation indices. A total of types of vegetation indices were extracted, including normalized difference vegetation index (NDVI), ratio vegetation index (RVI), triangular vegetation index (TVI), photochemical reflectance index (PRI), and normalized pigment chlorophyll ratio index (NPCI). These indices were constructed using the following formula:</p>
<disp-formula id="eq1">
<label>(1)</label>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:mtext>NDVI</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mtext>r</mml:mtext>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mtext>r</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>NIR</mml:mtext>
<mml:mo stretchy="false">(</mml:mo>
<mml:msub>
<mml:mtext>r</mml:mtext>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mtext>VR</mml:mtext>
<mml:mo stretchy="false">(</mml:mo>
<mml:msub>
<mml:mtext>r</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mtext>NIR</mml:mtext>
<mml:mo stretchy="false">(</mml:mo>
<mml:msub>
<mml:mtext>r</mml:mtext>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:mtext>VR</mml:mtext>
<mml:mo stretchy="false">(</mml:mo>
<mml:msub>
<mml:mtext>r</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq2">
<label>(2)</label>
<mml:math display="block" id="M2">
<mml:mrow>
<mml:mtext>RVI</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mtext>r</mml:mtext>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mtext>r</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>NIR</mml:mtext>
<mml:mo stretchy="false">(</mml:mo>
<mml:msub>
<mml:mtext>r</mml:mtext>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mtext>VR</mml:mtext>
<mml:mo stretchy="false">(</mml:mo>
<mml:msub>
<mml:mtext>r</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq3">
<label>(3)</label>
<mml:math display="block" id="M3">
<mml:mrow>
<mml:mtext>TVI</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>0.5</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:mn>120</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mtext>R</mml:mtext>
<mml:mrow>
<mml:mn>750</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mtext>R</mml:mtext>
<mml:mrow>
<mml:mn>550</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>200</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mtext>R</mml:mtext>
<mml:mrow>
<mml:mn>650</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mtext>R</mml:mtext>
<mml:mrow>
<mml:mn>550</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq4">
<label>(4)</label>
<mml:math display="block" id="M4">
<mml:mrow>
<mml:mtext>PRI</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mtext>R</mml:mtext>
<mml:mrow>
<mml:mn>531</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mtext>R</mml:mtext>
<mml:mrow>
<mml:mn>570</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mtext>R</mml:mtext>
<mml:mrow>
<mml:mn>531</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mtext>R</mml:mtext>
<mml:mrow>
<mml:mn>570</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq5">
<label>(5)</label>
<mml:math display="block" id="M5">
<mml:mrow>
<mml:mtext>NPCI</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mtext>R</mml:mtext>
<mml:mrow>
<mml:mn>680</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mtext>R</mml:mtext>
<mml:mrow>
<mml:mn>430</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mtext>R</mml:mtext>
<mml:mrow>
<mml:mn>680</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mtext>R</mml:mtext>
<mml:mrow>
<mml:mn>430</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>The bands <italic>r</italic>
<sub>1</sub> and <italic>r</italic>
<sub>2</sub> correspond to distinct regions of the light spectrum, with <italic>r</italic>
<sub>1</sub> encompassing the near-infrared region and <italic>r</italic>
<sub>2</sub> encompassing the infrared region. Specifically, <italic>r</italic>
<sub>1</sub> comprises wave lengths of 724nm, 738nm, 750nm, 764nm, 776nm, 790nm, 802nm, and 814nm, while <italic>r<sub>2</sub>
</italic> consists of 601nm, 605nm, 614nm, 627nm, 6336nm, 644nm, 652nm, 660nm, 669nm, and 677nm. Leveraging these bands, we derived 80 features for the NDVI and 80 features for the RVI. Additionally, we formulated a TVI feature utilizing wavelengths 750nm, 550nm, and 650nm, a PRI feature using wave-lengths 531nm and 570nm, and an NPCI feature using wavelengths 680nm and 430nm. In total, 163 vegetation index features were extracted from the hyperspectral data.</p>
</sec>
<sec id="s2_7">
<label>2.7</label>
<title>Evaluation indicators</title>
<p>Accuracy (ACC), area under the curve (AUC), and matthews correlation coefficient (MCC) are utilized as evaluation metrics to assess the performance of the model predictions. These metrics are defined as follows:</p>
<disp-formula id="eq6">
<label>(6)</label>
<mml:math display="block" id="M6">
<mml:mrow>
<mml:mtext>ACC</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>TN</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>TN</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>FP</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>FN</mml:mtext>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq7">
<label>(7)</label>
<mml:math display="block" id="M7">
<mml:mrow>
<mml:mtext>MCC</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>TN</mml:mtext>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mtext>FN</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>FP</mml:mtext>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:msqrt>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>FN</mml:mtext>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mtext>TN</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>FP</mml:mtext>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>FP</mml:mtext>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mtext>TN</mml:mtext>
<mml:mo>+</mml:mo>
<mml:mtext>FN</mml:mtext>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Where TP, TN, FP, and FN represent true positive, true negative, false positive, and false negative, respectively. The receiver operating characteristic (ROC) curve illustrates the true-positive rate against the false-positive rate (1 - specificity) for various thresholds. The AUC of the ROC curve is analyzed to provide a comprehensive metric for evaluating prediction methods. Higher values of ACC, MCC, and AUC indicate better prediction ability.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>A conventional machine learning-based model for classifying barnyard grass and rice at seedling stage</title>
<p>We initially assessed the performance of traditional machine learning models in aiding the hyper-spectral differentiation between barnyard grass and rice during the seedling stage. Additionally, we investigated the impact of various data preprocessing methods on model performance. Hyperspectral data, subjected to diverse various preprocessing techniques, constituted the input data for the traditional machine learning models, and the prediction results for independent test set of each model are illustrated in <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>. Among the four traditional machine learning models, XGBoost exhibited the most predictive performance, with average ACC, MCC, and AUC values reaching 0.9261, 0.8499, and 0.9579, respectively. Following XGBoost, the SVM model emerged as the second best, achieving average ACC, MCC, and AUC of 0.9224, 0.8415, and 0.9565, respectively. In contrast, the DT model displayed the lowest prediction accuracy, with average ACC, MCC, and AUC metrics of only 0.8982, 0.7920, and 0.8920, respectively. Compared to the original data, all four types of preprocessing methods effectively improved the model prediction performance, with SNV exhibiting the most notable improvement. SNV yielded average ACC, MCC, and AUC values of 0.9212, 0.8420, and 0.9653, respectively. Overall, irrespective of preprocessing or the choice of machine learning algorithms, the ACC and MCC of the hyperspectral-based machine learning model consistently surpassed 0.88 and 0.76, respectively, in distinguishing between barnyard grass and rice during the seedling stage. These findings underscore the potential of hyperspectral data in distinguishing between barnyard grass and rice at the seedling stage.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Comparative analysis of various evaluation metrics for traditional machine learning with different preprocessing techniques. <bold>(A&#x2013;C)</bold> show the performance comparison of ACC, MCC, and AUC respectively. The numbers above the bars in the figure indicate the average scores of the metrics for the five models under each preprocessing algorithm.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1507442-g004.tif"/>
</fig>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Classification model based on feature dimensionality reduction</title>
<p>To enhance the predictive accuracy of our models, we employed three distinct feature engineering strategies aimed at reducing its dimensionality: feature dimensionality reduction, feature selection, and vegetation index conversion. We applied spectral data after SNV pre-processing for both feature dimensionality reduction and feature selection, while vegetation index conversion was conducted based on the original spectral reflectance data. For PCA and t-SNE, we determined the optimal retained dimensionality by evaluating 10-fold cross-validation ACC using XGBoost on training set. PCA&#xa0;retained thirty principal components, while t-SNE retained twelve features. The SPA band selection process and the CARS band selection process were visualized in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>. As the number of characteristic bands increases, the RMSE value decreases and levels off. When the RMSE stabilizes and reaches its optimum, the value is 0.2462. At this point, the SPA retained 16 bands, comprising wavelengths such as 678nm, 457nm, 693nm, 1410nm, 2182nm, 1951nm, 354nm, 2481nm, 376nm, 2483nm, 381nm, 374nm, 1619nm, 2485nm,2486 and 2488nm. In <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5A</bold>
</xref>, the number of bands gradually decreases and stabilizes, while <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref> shows a decreasing trend followed by an increase. At a sampling number of 21, the RMSECV reaches its minimum, leading to the selection of the bands obtained from the 21<sup>th</sup> sampling as the characteristic wavelengths, totaling 108 wavelengths. Additionally, we derived 163 vegetation index features through band conversion.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Feature selection process. The plots marked as <bold>(A, B)</bold> represent the CARS feature selection process, and those marked as <bold>(C, D)</bold> represent the SPA feature selection process. <bold>(A)</bold> shows how the number of selected variables changes as the sample size increases and <bold>(B)</bold> illustrates the variation in cross-validation RMSE values with an increasing number of samples. the process of variable selection and the results of variable selection based on SPA algorithm are presented in the diagrams labeled <bold>(C, D)</bold>, respectively.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1507442-g005.tif"/>
</fig>
<p>Drawing from important features retained by various feature engineering strategies, we constructed traditional machine learning models and presented the results of independent tests in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>. Utilizing vegetation index features, the average ACC and MCC of the four machine learning models were 0.9152 and 0.8311, respectively, notably lower than those of the prediction model based on the full band, where the average ACC and MCC were 0.9212 and 0.8420, respectively. Following PCA downscaling, the model prediction accuracy showed slight improvement Compared to the full band except for the DT model, registering an average ACC and MCC of 0.9353 and 0.8712, yet, the DT model experiences a slight reduction, primarily observed in the decline of ACC and MCC to 0.8242 and 0.6583. However, t-SNE, SPA, and CARS feature downscaling methods exhibited enhanced model prediction performance compared to full-band modeling. Among these, the t-SNE feature dimensionality reduction method demonstrated the most significant improvement, with an average ACC and MCC of 0.9409 and 0.8800, respectively. The SVM model based on the retained features of SPA exhibited the best prediction outcomes, attaining an ACC and MCC of 0.9455 and 0.8886, respectively. These findings indicate the effectiveness of feature dimensionality reduction methods, particularly t-SNE, in enhancing the performance of traditional machine learning models.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Performance impact of different feature dimensionality reduction methods on traditional machine learning models.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Feature engineering <break/>strategies</th>
<th valign="middle" align="center">Evaluation Measures</th>
<th valign="middle" align="center">Dt</th>
<th valign="middle" align="center">RF</th>
<th valign="middle" align="center">SVM</th>
<th valign="middle" align="center">Xgboost</th>
<th valign="middle" align="center">Average</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">PCA</td>
<td valign="middle" align="center">ACC</td>
<td valign="top" align="center">0.8242</td>
<td valign="top" align="center">0.9394</td>
<td valign="top" align="center">0.9333</td>
<td valign="top" align="center">0.9333</td>
<td valign="middle" align="center">0.9076</td>
</tr>
<tr>
<td valign="middle" align="center"/>
<td valign="middle" align="center">MCC</td>
<td valign="top" align="center">0.6583</td>
<td valign="top" align="center">0.8806</td>
<td valign="top" align="center">0.8639</td>
<td valign="top" align="center">0.8691</td>
<td valign="middle" align="center">0.8180</td>
</tr>
<tr>
<td valign="middle" align="center">T-SNE</td>
<td valign="middle" align="center">ACC</td>
<td valign="top" align="center">0.9455</td>
<td valign="top" align="center">0.9394</td>
<td valign="top" align="center">0.9394</td>
<td valign="top" align="center">0.9394</td>
<td valign="middle" align="center">0.9409</td>
</tr>
<tr>
<td valign="middle" align="center"/>
<td valign="middle" align="center">MCC</td>
<td valign="top" align="center">0.8896</td>
<td valign="top" align="center">0.8779</td>
<td valign="top" align="center">0.8767</td>
<td valign="top" align="center">0.8759</td>
<td valign="middle" align="center">0.8800</td>
</tr>
<tr>
<td valign="middle" align="center">SPA</td>
<td valign="middle" align="center">ACC</td>
<td valign="top" align="center">0.9030</td>
<td valign="top" align="center">0.9091</td>
<td valign="top" align="center">0.9455</td>
<td valign="top" align="center">0.9333</td>
<td valign="middle" align="center">0.9227</td>
</tr>
<tr>
<td valign="middle" align="center"/>
<td valign="middle" align="center">MCC</td>
<td valign="top" align="center">0.8112</td>
<td valign="top" align="center">0.822</td>
<td valign="top" align="center">0.8886</td>
<td valign="top" align="center">0.8664</td>
<td valign="middle" align="center">0.8471</td>
</tr>
<tr>
<td valign="middle" align="center">CARS</td>
<td valign="middle" align="center">ACC</td>
<td valign="top" align="center">0.9394</td>
<td valign="top" align="center">0.9333</td>
<td valign="top" align="center">0.9273</td>
<td valign="top" align="center">0.9394</td>
<td valign="middle" align="center">0.9349</td>
</tr>
<tr>
<td valign="middle" align="center"/>
<td valign="middle" align="center">MCC</td>
<td valign="top" align="center">0.8779</td>
<td valign="top" align="center">0.8639</td>
<td valign="top" align="center">0.8519</td>
<td valign="top" align="center">0.8759</td>
<td valign="middle" align="center">0.8674</td>
</tr>
<tr>
<td valign="middle" align="center">Vegetation indices</td>
<td valign="middle" align="center">ACC</td>
<td valign="top" align="center">0.9152</td>
<td valign="top" align="center">0.8909</td>
<td valign="top" align="center">0.9212</td>
<td valign="top" align="center">0.9333</td>
<td valign="middle" align="center">0.9152</td>
</tr>
<tr>
<td valign="middle" align="center"/>
<td valign="middle" align="center">MCC</td>
<td valign="top" align="center">0.8329</td>
<td valign="top" align="center">0.7867</td>
<td valign="top" align="center">0.8385</td>
<td valign="top" align="center">0.8664</td>
<td valign="middle" align="center">0.8311</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>DeepBGS-based model for classification of barnyard grass and rice at seedling stage</title>
<p>Transforming linear hyperspectral reflectance data into 2D matrix data through subsequence division is crucial for extracting spectral global and local correlation features by DeepBGS. Therefore, our initial focus lies in optimizing the subsequence window length and sliding step length to select appropriate parameters for the DeepBGS model. Through grid optimization grounded in 10-fold cross-validation of the training set, we explored various combinations of window lengths and sliding step lengths within the range of 50-300, with a step length of 50. Previous results have shown that the models achieve the best prediction performance following the preprocessing of original data using SNV. Hence, DeepBGS modeling exclusively relies on SNV preprocessed data, and the 10-fold cross-segmentation of the training set remains consistent across all combinations of window length and sliding step length. The model prediction outcomes across different combinations of window length and sliding step length were visualized in <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>. Notably, when the window length is set to 200 and the sliding step length to 150, the DeepBGS model attained its highest training performance, with ACC, MCC, and AUC reaching 0.9979, 0.9958, and 0.9999, respectively.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Effects of various combinations of window length and sliding step size on model performance. <bold>(A&#x2013;C)</bold> show the performance of ACC, MCC, and AUC respectively. The horizontal axis is the step size, and the vertical axis is the window size.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1507442-g006.tif"/>
</fig>
<p>Based on the optimal combination of window length and sliding step (<italic>w</italic> = 200, <italic>s</italic> = 150), we further compared the performance of deep convolutional networks for extracting sequence matrix features. As illustrated in <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>, <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref>, all five deep learning models demonstrate robust capabilities in distinguishing seedling barnyard grass from rice, with ACC surpassing 0.93 and MCC exceeding 0.87. Remarkably, the DeepBGS model emerges as the top performer, achieving a flawless differentiation rate of 98.18%. All 95 barnyard grass samples were correctly classified, with only 3 out of 70 rice samples misclassified as barnyard grass (<xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>). In contrast, the DeepBGS-NoLSTM model, which excludes the LSTM module, experiences a slight reduction in independent test accuracy, primarily observed in the decline of ACC and MCC to 0.9697 and 0.9379. The VGG model, without the batch normalization layer, exhibited a more pronounced decrease in prediction performance, with ACC and MCC plummeting to only 0.9515 and 0.9014, respectively, comparable to traditional machine learning models. And the MLP module attained ACC and MCC scores of 0.9394 and 0.8779. Meanwhile, the Resnet18 model, which featured an 18-layer network, attained ACC and MCC scores of 0.9636 and 0.9256, respectively, underscoring its efficacy in distinguishing between barnyard grass and rice at the seedling stage. However, augmenting the network depth to 50 layers resulted in diminished prediction accuracy for the Resnet50 model, with ACC and MCC declining to 0.9455 and 0.8886, respectively.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Independent test performance of deep learning models.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Evaluation Measures</th>
<th valign="middle" align="center">DeepBGS</th>
<th valign="middle" align="center">DeepBGS-NoLSTM</th>
<th valign="middle" align="center">VGG</th>
<th valign="middle" align="center">Resnet18</th>
<th valign="middle" align="center">Resnet50</th>
<th valign="middle" align="center">MLP</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">ACC</td>
<td valign="middle" align="center">0.9818</td>
<td valign="middle" align="center">0.9697</td>
<td valign="middle" align="center">0.9515</td>
<td valign="middle" align="center">0.9636</td>
<td valign="top" align="center">0.9455</td>
<td valign="middle" align="center">0.9394</td>
</tr>
<tr>
<td valign="middle" align="center">MCC</td>
<td valign="middle" align="center">0.9632</td>
<td valign="middle" align="center">0.9379</td>
<td valign="middle" align="center">0.9014</td>
<td valign="middle" align="center">0.9256</td>
<td valign="top" align="center">0.8886</td>
<td valign="middle" align="center">0.8779</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Training performance of Resnet models with different depths. <bold>(A)</bold> is Resnet18 and <bold>(B)</bold> is Resnet50.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-16-1507442-g007.tif"/>
</fig>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Confusion matrix for the prediction results of the DeepBGS.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="bottom" rowspan="2" align="center"/>
<th valign="middle" rowspan="2" align="center"/>
<th valign="middle" colspan="2" align="center">Predicted classes</th>
</tr>
<tr>
<th valign="bottom" align="center">Barnyard grass</th>
<th valign="bottom" align="center">Rice</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="2" align="center">Actual classes</td>
<td valign="bottom" align="center">Barnyard grass</td>
<td valign="bottom" align="center">95</td>
<td valign="bottom" align="center">0</td>
</tr>
<tr>
<td valign="bottom" align="center">Rice</td>
<td valign="bottom" align="center">3</td>
<td valign="bottom" align="center">67</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>Controlling barnyard grass is particularly challenging due to its strong resistance to herbicides. Effective control of barnyard grass in the early stages can significantly reduce both economic and environmental costs. Establishing a dependable early identification system for weeds is paramount, with HS emerging as a promising avenue over RGB imaging. Unlike the latter, HS focuses on phytochemical composition indicators rather than solely shape, size, and color, offering distinct advantages (<xref ref-type="bibr" rid="B7">Farooq et&#xa0;al., 2018</xref>). Hyperspectral data furnishes intricate reflectance information across numerous narrow spectral bands. However, grappling with the high redundancy and multicollinearity inherent in these bands presents a formidable obstacle. Extracting actionable insights from such data stands as a pivotal requirement for effective weed early identification. Prior studies, exemplified <xref ref-type="bibr" rid="B28">Zhang et&#xa0;al. (2019)</xref>, have demonstrated promising outcomes utilizing methodologies like the SPA in tandem with weighted SVM models for the identification of barnyard grass, weedy rice, and rice, achieving high recognition rates. In the present study, we employed three feature engineering methods: feature dimensionality reduction, feature selection, and vegetation index conversion. While certain methods like PCA and vegetation index conversion failed to bolster model accuracy, others such as t-SNE for dimensionality reduction and feature selection techniques like CARS and SPA exhibited enhancements in prediction performance. However, achieving accurate differentiation between barnyard grass and rice at the seedling stage remains an ongoing challenge.</p>
<p>This study compares the performance of traditional machine learning models and deep learning methods in identifying barnyard grass and rice at the seedling stage. Unlike traditional approaches, deep learning eliminates the need for complex feature engineering, autonomously extracting meaningful patterns from raw data to achieve superior classification results (<xref ref-type="bibr" rid="B22">Perez-Sanz et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B24">Sari&#x107; et&#xa0;al., 2022</xref>). Although a defining feature of deep learning is that the input data can be unstructured (<xref ref-type="bibr" rid="B19">Murphy et&#xa0;al., 2024</xref>), the non-imaging hyperspectral data in this study is inherently structured. When a simple fully connected network is used, its prediction accuracy reaches 0.9394, comparable to that of traditional machine learning models. To fully capture both local and global associations among hyperspectral bands, we introduce a subsequence conversion method based on sliding windows. This approach transforms the hyperspectral bands from one-dimensional vectors into two-dimensional matrices, enabling them to serve as input for a deep learning model that combines convolutional networks and LSTM. This method leverages the robust feature extraction capabilities of deep learning. Building on the ResNet model, we examined the effect of network depth on model performance and found that excessive depth can lead to overfitting. As shown in <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref>, the Resnet18 model, despite its lower network depth, achieved stable training results after only 31 rounds of training, with both training ACC and MCC stabilizing at 0.9778 and 0.9556, respectively. In the independent test, the ACC and MCC remained stable at 0.9636 and 0.9256, respectively. Conversely, after 28 rounds of training for the Resnet50 model with increased network depth, although the loss stabilized, the training ACC and MCC reach slightly lower values of 0.9687 and 0.9394, respectively. However, the final independent test performance exhibited more significantly decline, with the ACC and MCC dropping to 0.9455 and 0.8886, respectively. This phenomenon may arise from the limited training data, which makes models with complex network architectures more susceptible to overfitting. Consequently, DeepBGS in this study employs only a 9-layer convolutional module.</p>
<p>This study investigates the hyperspectral characteristics distinction between barnyard grass and rice at the seedling stage and proposes a deep learning-based framework for hyperspectral feature extraction. However, the current approach relies solely on indoor non-imaging methods to extract spectral features, and the limited number of training samples necessitates further work before it can be applied in the field. First, the spectral data from crop canopies in the field are filtered by various factors, such as sunlight, angle, cloud absorption, and shadows, leading to significant differences from the controlled laboratory environment. Therefore, acquiring more field-labeled samples is crucial for enhancing the model&#x2019;s practical applicability. Additionally, transfer learning may offer a solution for developing effective models with limited training data. For real-time weed recognition models deployed in the field, those with lower costs and higher computational efficiency may be preferable, even at the expense of reduced accuracy (<xref ref-type="bibr" rid="B19">Murphy et&#xa0;al., 2024</xref>). Therefore, extending the model to field-based hyperspectral imaging data and using tools such as deep learning important features (DeepLiFT) and class activation mapping (CAM) to enhance the interpretability of deep learning models&#x2014;by identifying key spectral bands&#x2014;could guide the development of more cost-effective multispectral devices, significantly advancing early weed detection technology in the field.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusion</title>
<p>Barnyard grass resistance to pesticides increases with growth, making early identification and precise control essential for reducing pesticide use and advancing precision agriculture. To address the challenge of distinguishing barnyard grass from rice seedlings at the early growth stage, this study explores hyperspectral imaging for identification. A combined model incorporating multiple spectral preprocessing techniques, feature engineering methods, and traditional machine learning was evaluated, achieving a maximum classification accuracy of 93.94%. Finally, we developed a deep learning-based framework for extracting hyperspectral features, achieving 98.18% accuracy in distinguishing seedling barnyard grass from rice.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: Data will be made available at <uri xlink:href="https://github.com/dejavu1021/DeepBGS">https://github.com/dejavu1021/DeepBGS</uri>.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>ST: Project administration, Resources, Writing &#x2013; review &amp; editing, Funding acquisition. QX: Writing &#x2013; review &amp; editing, Conceptualization, Data curation, Formal analysis, Methodology, Software, Validation, Visualization, Writing &#x2013; original draft. WZ: Writing &#x2013; original draft, Investigation, Resources. YD: Writing &#x2013; review &amp; editing. LZ: Writing &#x2013; review &amp; editing. XY: Investigation, Resources, Writing &#x2013; original draft. ZY: Writing &#x2013; review &amp; editing. YC: Writing &#x2013; review &amp; editing, Project administration, Resources.</p>
</sec>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the&#xa0;research, authorship, and/or publication of this article. This&#xa0;research was supported in part by the National Key R\&amp;D Program of China (2023YFD1401100), Hunan Provincial Key Research and Development Program (2024AQ2035, 2023NK2011), Interdisciplinary Research Youth Guidance Project of Hunan Agricultural University under Grants 2024XKJC04, Provincial Science and Technology Innovation Team (S2021YZCXTD0024), Funding for Changsha Science and Technology Plan Project (kh2303010), the Scientific Research Project of Hunan Provincial Department of Education (21B0187).</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>The authors thank all researchers who contributed to the advancement of science.</p>
</ack>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Amigo</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Grassi</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Configuration of hyperspectral and multispectral imaging systems</article-title>. <source>Data Hand. Sci. Technol.</source> <volume>32</volume>, <fpage>17</fpage>&#x2013;<lpage>34</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/B978-0-444-63977-6.00002-X</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ara&#xfa;jo</surname> <given-names>M. C. U.</given-names>
</name>
<name>
<surname>Saldanha</surname> <given-names>T. C. B.</given-names>
</name>
<name>
<surname>Galv&#xe3;o</surname> <given-names>R. K. H.</given-names>
</name>
<name>
<surname>Yoneyama</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Chame</surname> <given-names>H. C.</given-names>
</name>
<name>
<surname>Visan</surname> <given-names>V.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>The successive projections algorithm for variable selection in spectroscopic multicomponent analysis</article-title>. <source>Chemometr. Intell. Lab.</source> <volume>57</volume>, <fpage>65</fpage>&#x2013;<lpage>73</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0169-7439(01)00119-8</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Belkina</surname> <given-names>A. C.</given-names>
</name>
<name>
<surname>Ciccolella</surname> <given-names>C. O.</given-names>
</name>
<name>
<surname>Anno</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Halpert</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Spidlen</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Snyder-Cappione</surname> <given-names>J. E.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Automated optimized parameters for T-distributed stochastic neighbor embedding improve visualization and analysis of large datasets</article-title>. <source>Nat. Commun.</source> <volume>10</volume>, <fpage>5415</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41467-019-13055-y</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bi</surname> <given-names>Y. M.</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>K. L.</given-names>
</name>
<name>
<surname>Xiao</surname> <given-names>W. Q.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>J. Z.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>C. Y.</given-names>
</name>
<name>
<surname>Xia</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>A local pre-processing method for near-infrared spectra, combined with spectral segmentation and standard normal variate transformation</article-title>. <source>Anal. Chim. Acta</source> <volume>909</volume>, <fpage>30</fpage>&#x2013;<lpage>40</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.aca.2016.01.010</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Random forests</article-title>. <source>Mach. Learn.</source> <volume>45</volume>, <fpage>5</fpage>&#x2013;<lpage>32</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Diao</surname> <given-names>Z. H.</given-names>
</name>
<name>
<surname>Yan</surname> <given-names>J. N.</given-names>
</name>
<name>
<surname>He</surname> <given-names>Z. D.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>S. N.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>P. L.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Corn seedling recognition algorithm based on hyperspectral image and lightweight-3D-CNN</article-title>. <source>Comput. Election. Agr.</source> <volume>201</volume>, <elocation-id>107343</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.107343</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Farooq</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>J. K.</given-names>
</name>
<name>
<surname>Jia</surname> <given-names>X. P.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Analysis of spectral bands and spatial resolutions for weed classification via deep convolutional neural network</article-title>. <source>IEEE Geosci. Remote S.</source> <volume>16</volume> (<issue>2</issue>), <fpage>183</fpage>&#x2013;<lpage>187</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/LGRS.2018.2869879</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hearst</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Dumais</surname> <given-names>S. T.</given-names>
</name>
<name>
<surname>Osuna</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Platt</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Scholkopf</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>Support vector machines</article-title>. <source>IEEE Intell. Syst. Appl.</source> <volume>13</volume>, <fpage>18</fpage>&#x2013;<lpage>28</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/5254.708428</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname> <given-names>H. S.</given-names>
</name>
<name>
<surname>Deng</surname> <given-names>J. Z.</given-names>
</name>
<name>
<surname>Lan</surname> <given-names>Y. B.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>A. Q.</given-names>
</name>
<name>
<surname>Deng</surname> <given-names>X. L.</given-names>
</name>
<name>
<surname>Wen</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Accurate weed mapping and prescription map generation based on fully convolutional networks using UAV imagery</article-title>. <source>Sensors-Basel</source> <volume>18</volume>, <elocation-id>3299</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/s18103299</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ijomah</surname> <given-names>A. M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Second order regression with two predictor variables centered on mean in an ill conditioned model</article-title>. <source>Int. J. Stat. Appl.</source> <volume>9</volume>, <fpage>101</fpage>&#x2013;<lpage>110</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5923/j.statistics.20190904.01</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kamath</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Balachandra</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Prabhu</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Paddy crop and weed discrimination: A multiple classifier system approach</article-title>. <source>Int. J. Agron.</source> <volume>2020</volume>, <fpage>1</fpage>&#x2013;<lpage>14</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2020/6474536</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lan</surname> <given-names>Y. B.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>K. H.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Lei</surname> <given-names>L. C.</given-names>
</name>
<name>
<surname>Ye</surname> <given-names>J. H.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J. L.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Real-time identification of rice weeds by uav low-altitude remote sensing based on improved semantic segmentation mode</article-title>. <source>Remote Sens.-Basel</source> <volume>13</volume>, <elocation-id>4370</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs13214370</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>Y. Z.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>Q. S.</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>D. S.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Key wavelengths screening using competitive adaptive reweighted sampling method for multivariate calibration</article-title>. <source>Anal. Chim. Acta</source> <volume>648</volume>, <fpage>77</fpage>&#x2013;<lpage>84</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.aca.2009.06.046</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Y. J.</given-names>
</name>
<name>
<surname>Al-Sarayreh</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Irie</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Hackell</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Bourdot</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Reis</surname> <given-names>M. M.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Identification of weeds based on hyperspectral imaging and machine learning</article-title>. <source>Front. Plant Sci.</source> <volume>11</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2020.611622</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>E. Q.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>S. H.</given-names>
</name>
<name>
<surname>He</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Xiao</surname> <given-names>X. M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Identification of plant species in an alpine steppe of Northern Tibet using close-range hyperspectral imagery</article-title>. <source>Ecol. Inform.</source> <volume>61</volume>, <elocation-id>101213</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ecoinf.2021.101213</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname> <given-names>J. W.</given-names>
</name>
<name>
<surname>Ying</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Bai</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Savitzky-Golay smoothing and differentiation filter for even number data</article-title>. <source>Signal Process.</source> <volume>85</volume>, <fpage>1429</fpage>&#x2013;<lpage>1434</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.sigpro.2005.02.002</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ma</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Deng</surname> <given-names>X. W.</given-names>
</name>
<name>
<surname>Qi</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>H. W.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y. W.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Fully convolutional network for rice seedling and weed image segmentation at the seedling stage in paddy fields</article-title>. <source>PLoS One</source> <volume>14</volume>, <elocation-id>e0215676</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0215676</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mishra</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Asaari</surname> <given-names>M. S. M.</given-names>
</name>
<name>
<surname>Herrero-Langreo</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Lohumi</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Diezma</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Scheunders</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Close range hyperspectral imaging of plants: A review</article-title>. <source>Biosyst. Eng.</source> <volume>164</volume>, <fpage>49</fpage>&#x2013;<lpage>46</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.biosystemseng.2017.09.009</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Murphy</surname> <given-names>K. M.</given-names>
</name>
<name>
<surname>Ludwig</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Gutierrez</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Gehan</surname> <given-names>M. A.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Deep learning in image-based plant phenotyping</article-title>. <source>Annu. Rev. Plant Biol.</source> <volume>75</volume>, <fpage>771</fpage>&#x2013;<lpage>795</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev-arplant-070523-042828</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Osman</surname> <given-names>A. I. A.</given-names>
</name>
<name>
<surname>Ahmed</surname> <given-names>A. N.</given-names>
</name>
<name>
<surname>Chow</surname> <given-names>M. F.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>Y. F.</given-names>
</name>
<name>
<surname>El-Shafie</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Extreme gradient boosting (Xgboost) model to predict the groundwater levels in Selangor Malaysia</article-title>. <source>Ain Shams Eng. J.</source> <volume>12</volume>, <fpage>1545</fpage>&#x2013;<lpage>1556</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.asej.2020.11.011</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peng</surname> <given-names>H. X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z. H.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>Z. Y.</given-names>
</name>
<name>
<surname>Shao</surname> <given-names>Y. Y.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Weed detection in paddy field using an improved RetinaNet network</article-title>. <source>Comput. Election. Agr.</source> <volume>199</volume>, <elocation-id>107179</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.107179</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Perez-Sanz</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Navarro</surname> <given-names>P. J.</given-names>
</name>
<name>
<surname>Egea-Cortines</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Plant phenomics: An overview of image acquisition technologies and image data analysis algorithms</article-title>. <source>GigaScience</source> <volume>6</volume>, <fpage>1</fpage>&#x2013;<lpage>18</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gigascience/gix092</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Riedmiller</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>Advanced supervised learning in multi-layer perceptrons&#x2014;from backpropagation to adaptive learning algorithms</article-title>. <source>Comput. Stand. Inter.</source> <volume>16</volume>, <fpage>265</fpage>&#x2013;<lpage>278</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0920-5489(94)90017-5</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sari&#x107;</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Nguyen</surname> <given-names>V. D.</given-names>
</name>
<name>
<surname>Burge</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Berkowitz</surname> <given-names>O.</given-names>
</name>
<name>
<surname>Trt&#xed;lek</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Whelan</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Applications of hyperspectral imaging in plant phenotyping</article-title>. <source>Trends Plant Sci.</source> <volume>27</volume>, <fpage>301</fpage>&#x2013;<lpage>315</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.tplants.2021.12.003</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Song</surname> <given-names>Y. Y.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Decision tree methods: applications for classification and prediction</article-title>. <source>Shanghai Arch. Psychiatry</source> <volume>27</volume>, <fpage>130</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.11919/j.issn.1002-0829.215044</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Timothy</surname> <given-names>O.</given-names>
</name>
<name>
<surname>Anuradha</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Moving average and autoregressive correlation structures under multivariate skew normality</article-title>. <source>Commun. Stat.-Simul. C.</source> <volume>52</volume> (<issue>1</issue>), <fpage>84</fpage>&#x2013;<lpage>97</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/03610918.2020.1847292</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wold</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Esbensen</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Geladi</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>1987</year>). <article-title>Principal component analysis</article-title>. <source>Chemometr. Intell. Lab.</source> <volume>2</volume>, <fpage>37</fpage>&#x2013;<lpage>52</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0169-7439(87)80084-9</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>Y. C.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>J. F.</given-names>
</name>
<name>
<surname>Cen</surname> <given-names>H. Y.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>Y. L.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>X. Y.</given-names>
</name>
<name>
<surname>He</surname> <given-names>Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Automated spectral feature extraction from hyperspectral images to differentiate weedy rice and barnyard grass from a rice crop</article-title>. <source>Comput. Election. Agr.</source> <volume>159</volume>, <fpage>42</fpage>&#x2013;<lpage>49</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2019.02.0</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>