<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1518205</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2024.1518205</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Classical and machine learning tools for identifying yellow-seeded <italic>Brassica napus</italic> by fusion of hyperspectral features</article-title>
<alt-title alt-title-type="left-running-head">Liu et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fgene.2024.1518205">10.3389/fgene.2024.1518205</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Fan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2898473/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Wang</surname>
<given-names>Fang</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2426321/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Zaiqi</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Cao</surname>
<given-names>Liang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wu</surname>
<given-names>Jinran</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1842646/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>You-Gan</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Hunan Provincial Key Laboratory of Dong Medicine</institution>, <institution>Hunan University of Medicine</institution>, <addr-line>Huaihua</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Key Laboratory of Intelligent Computing and Information Processing of Ministry of Education and Hunan Key Laboratory for Computation and Simulation in Science and Engineering</institution>, <institution>Xiangtan University</institution>, <addr-line>Xiangtan</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>School of Mathematics and Physics</institution>, <institution>The University of Queensland</institution>, <addr-line>Brisbane</addr-line>, <addr-line>QLD</addr-line>, <country>Australia</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2765209/overview">Zhiqiang Wang</ext-link>, Chengdu Agriculture College, China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2082140/overview">Hong Bo</ext-link>, Lushan Botanical Garden (CAS), China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2901583/overview">Mengzhuo Luo</ext-link>, Guilin University of Technology, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2901613/overview">Liang Li</ext-link>, Hunan Institute of Agricultural Information and Engineering, China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Fang Wang, <email>fwang4@xtu.edu.cn</email>
</corresp>
<fn fn-type="other" id="fn1">
<label>
<sup>&#x2020;</sup>
</label>
<p>ORCID: ; Fan Liu, <ext-link ext-link-type="uri" xlink:href="http://orcid.org/0009-0005-8356-5588">orcid.org/0009-0005-8356-5588</ext-link>; Fang Wang, <ext-link ext-link-type="uri" xlink:href="http://orcid.org/0000-0002-4756-719X">orcid.org/0000-0002-4756-719X</ext-link>; Zaiqi Zhang, <ext-link ext-link-type="uri" xlink:href="http://orcid.org/0009-0009-8200-8674">orcid.org/0009-0009-8200-8674</ext-link>; Liang Cao, <ext-link ext-link-type="uri" xlink:href="http://orcid.org/0009-0005-8300-6428">orcid.org/0009-0005-8300-6428</ext-link>; Jinran Wu, <ext-link ext-link-type="uri" xlink:href="http://orcid.org/0000-0002-2388-3614">orcid.org/0000-0002-2388-3614</ext-link>; You-Gan Wang, <ext-link ext-link-type="uri" xlink:href="http://orcid.org/0000-0003-0901-4671">orcid.org/0000-0003-0901-4671</ext-link>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>15</day>
<month>01</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>15</volume>
<elocation-id>1518205</elocation-id>
<history>
<date date-type="received">
<day>28</day>
<month>10</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>26</day>
<month>12</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2025 Liu, Wang, Zhang, Cao, Wu and Wang.</copyright-statement>
<copyright-year>2025</copyright-year>
<copyright-holder>Liu, Wang, Zhang, Cao, Wu and Wang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Due to its favorable traits-such as lower lignin content, higher oil concentration, and increased protein levels-the genetic improvement of yellow-seeded rapeseed has attracted more attention than other rapeseed color variations. Traditionally, yellow-seeded rapeseed has been identified visually, but the complex variability in the seed coat color of <italic>Brassica napus</italic> has made manual identification challenging and often inaccurate. Another method, using the RGB color system, is frequently employed but is sensitive to photographic conditions, including lighting and camera settings.</p>
</sec>
<sec>
<title>Methods</title>
<p>We present four data-driven models to identify yellow-seeded <italic>B. napus</italic> using hyperspectral features combined with simple yet intelligent techniques. One model employs partial least squares regression (PLSR) to predict the R, G, and B color channels, effectively distinguishing yellow-seeded varieties from others according to globally accepted yellow-seed classification protocols. Another model uses logistic regression (Logit-R) to produce a probability-based assessment of yellow-seeded status. Additionally, we implement two intelligent models, random forest and support vector classifier to evaluate features selected through lasso-penalized logistic regression.</p>
</sec>
<sec>
<title>Results and Discussion</title>
<p>Our findings indicate significant recognition accuracies of 96.55% and 98% for the PLSR and Logit-R models, respectively, aligning closely with the accuracy of previous methods. This approach represents a meaningful advancement in identifying yellow-seeded rapeseed, with high recognition accuracy demonstrating the practical applicability of these models.</p>
</sec>
</abstract>
<kwd-group>
<kwd>rapeseed (Brassica napus)</kwd>
<kwd>yellow-seeded</kwd>
<kwd>hyperspectral feature</kwd>
<kwd>logistic regression</kwd>
<kwd>partial least squares regression</kwd>
<kwd>machine learning</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Genomics of Plants and the Phytoecosystem</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>The quality of life and wellbeing of individuals are deeply influenced by the quality of rapeseed. The global adoption of cultivating &#x201c;double high and double low&#x201d; rapeseed-characterized by high oleic acid and oil content, along with low erucic acid and sulfur glycosides-underscores its vital significance.</p>
<p>During development, rapeseed contains chlorophyll, giving it a green hue. As the seeds mature, they exhibit colors ranging from black and reddish-brown to yellow. The seed coats of black and reddish-brown seeds accumulate pigments, while the transparent seed coats of yellow-seeded varieties reveal the embryo&#x2019;s color. Studies indicate that yellow-seeded rapeseed has a shorter dormancy period, simpler germination, and higher oil content than black-seeded varieties, highlighting the breeding of yellow-seeded rapeseed as a valuable method to enhance oil content (<xref ref-type="bibr" rid="B37">Yang et al., 2021</xref>). Identifying yellow-seeded varieties of <italic>Brassica juncea</italic> and <italic>Brassica campestris</italic> is relatively straightforward, as the pure yellow phenotype is genetically stable (<xref ref-type="bibr" rid="B18">Li et al., 2012</xref>; <xref ref-type="bibr" rid="B7">Chen et al., 2015</xref>). However, stable, pure-yellow progeny have yet to be achieved in <italic>Brassica napus</italic> due to the complexity of seed coat color variations, including hetero-yellow patterns, such as yellow with black spots, patches, or brown rings. Additionally, the seed coat color of segregated progeny shows continuous variation (<xref ref-type="bibr" rid="B13">Liu, 1992</xref>; <xref ref-type="bibr" rid="B1">Auger et al., 2010</xref>; <xref ref-type="bibr" rid="B30">Qu et al., 2013</xref>). Consequently, accurately and efficiently determining the seed coat color of <italic>B. napus</italic> remains a critical and challenging task. Numerous studies address the identification of rapeseed color (<xref ref-type="bibr" rid="B16">Li et al., 2001</xref>; <xref ref-type="bibr" rid="B33">Somers et al., 2001</xref>; <xref ref-type="bibr" rid="B42">Zhang et al., 2006</xref>; <xref ref-type="bibr" rid="B2">Baetzel et al., 2003</xref>; <xref ref-type="bibr" rid="B34">Ta&#x144;ska et al., 2005</xref>; <xref ref-type="bibr" rid="B38">Li et al., 2012</xref>; <xref ref-type="bibr" rid="B23">Liu et al., 2005</xref>; <xref ref-type="bibr" rid="B29">Ye et al., 2018</xref>). For example, <xref ref-type="bibr" rid="B16">Li et al. (2001)</xref> estimated the yellow-seeded degree of <italic>B. napus</italic> through visual observation, a straightforward method but heavily reliant on the observer, leading to potentially inaccurate recognition. <xref ref-type="bibr" rid="B33">Somers et al. (2001)</xref> utilized light reflection to assess yellow-seeded color grade by measuring reflectance values and calculating the grain color index or light reflection values. While this method is more objective, it captures only single-dimensional color data, such as brightness, omitting rich information in the original material. To address this limitation, many scholars have focused on digital image analysis through the RGB color system (<xref ref-type="bibr" rid="B42">Zhang et al., 2006</xref>; <xref ref-type="bibr" rid="B2">Baetzel et al., 2003</xref>; <xref ref-type="bibr" rid="B34">Ta&#x144;ska et al., 2005</xref>; <xref ref-type="bibr" rid="B38">Li et al., 2012</xref>; <xref ref-type="bibr" rid="B23">Liu et al., 2005</xref>; <xref ref-type="bibr" rid="B29">Ye et al., 2018</xref>). However, the complex and similar coloration of the rapeseed epidermis makes precise color identification challenging, and the available techniques lack reliability and standardization. Accurate and efficient color measurement of yellow-seeded <italic>B. napus</italic> thus remains essential.</p>
<p>Recent advancements in chemometrics and computer technology have led to the development of near-infrared spectroscopy (NIRS), a technique combining both image and spectral data of the object. NIRS, known for its speed, non-destructive nature, and high efficiency, is widely used for the rapid, non-destructive analysis of agricultural products. Several studies have demonstrated its utility (<xref ref-type="bibr" rid="B10">Guo et al., 2019</xref>; <xref ref-type="bibr" rid="B6">Bu et al., 2023</xref>; <xref ref-type="bibr" rid="B19">Liang et al., 2023</xref>; <xref ref-type="bibr" rid="B21">Liu et al., 2021</xref>; <xref ref-type="bibr" rid="B27">Petisco et al., 2010</xref>; <xref ref-type="bibr" rid="B31">Sen et al., 2018</xref>; <xref ref-type="bibr" rid="B22">Liu et al., 2022</xref>; <xref ref-type="bibr" rid="B40">Zhang et al., 2020</xref>; <xref ref-type="bibr" rid="B36">Wei et al., 2020</xref>; <xref ref-type="bibr" rid="B41">Zhang et al., 2018</xref>; <xref ref-type="bibr" rid="B15">Jiang et al., 2017</xref>; <xref ref-type="bibr" rid="B17">Li et al., 2022</xref>; <xref ref-type="bibr" rid="B14">Jiang et al., 2018</xref>; <xref ref-type="bibr" rid="B11">He et al., 2022</xref>). For instance, <xref ref-type="bibr" rid="B10">Guo et al. (2019)</xref> used an NIRS imaging system (380&#x2013;1,000&#xa0;nm) to accurately quantify adulterated rice, while <xref ref-type="bibr" rid="B6">Bu et al. (2023)</xref> combined hyperspectral imaging with convolutional neural networks to create an intelligent model for sorghum variety recognition, surpassing existing models in accuracy. This technology has also been applied in rapeseed growth diagnostics. For example, <xref ref-type="bibr" rid="B21">Liu et al. (2021)</xref> developed a hyperspectral technique-based detection algorithm to predict the oleic acid content in <italic>B. napus</italic>. <xref ref-type="bibr" rid="B27">Petisco et al. (2010)</xref> examined visible and near-infrared spectra of <italic>B. napus</italic> and <italic>B. juncea</italic> with different oil levels, and <xref ref-type="bibr" rid="B22">Liu et al. (2022)</xref> developed an intelligent model that identified eleven <italic>B. napus</italic> varieties by integrating hyperspectral and spectral data, achieving a recognition accuracy of 93.71%. In another study, <xref ref-type="bibr" rid="B36">Wei et al. (2020)</xref> achieved 99.2% accuracy in classifying 15 soybean varieties through hyperspectral imaging, while <xref ref-type="bibr" rid="B17">Li et al. (2022)</xref> improved oleic acid content inversion in <italic>B. napus</italic> seeds by reducing hyperspectral redundancy.</p>
<p>As noted, identifying yellow-seeded <italic>B. napus</italic> is challenging due to the small seed size and complex seed coat color. Inconsistent RGB standards and labor-intensive calibration further complicate the task. The successful integration of hyperspectral technology in agriculture has paved the way for advancements in digital farming, inspiring us to apply it for yellow-seed identification. Furthermore, combining hyperspectral features with machine learning enhances remote sensing applications in smart agriculture, with hyperspectral analysis proving effective for modeling rapeseed aliphatic acid content. Hyperspectral sensing, a form of near-Earth remote sensing, provides a foundation for satellite- or drone-based agricultural monitoring. This technology facilitates tasks such as classification and inversion of land object parameters, which are challenging for traditional vision-based systems. Thus, our early-stage near-Earth remote sensing experiments are pivotal for advancing agricultural monitoring techniques.</p>
<p>In this study, we propose a novel approach to identifying yellow-seeded <italic>B. napus</italic> using hyperspectral imaging technology. We combine trilateral parameters derived from hyperspectral rapeseed imaging with spectral indices, applying partial least squares regression, logistic regression, random forest, and support vector classifiers. Importantly, the simplicity of spectral data collection addresses RGB calibration limitations. These intelligent models exhibit a commendable level of recognition accuracy. This study represents an initial exploration into rapeseed color classification through hyperspectral technology and machine learning, underscoring the significant potential of hyperspectral technology in tasks traditionally reliant on human vision systems.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>2 Methods and materials</title>
<sec id="s2-1">
<title>2.1 Materials</title>
<p>For this study, we used two high oleic acid rapeseed varieties, namely, Xiangyou 708 and Xiangyou 710 (<italic>B. napus. L</italic>). These varieties were cultivated in the paddy fields of Yunyuan Experimental Base (28&#xb0;23&#x2032;N, 112&#xb0;93&#x2032;E, as illustrated in <xref ref-type="fig" rid="F1">Figures 1A, B</xref>) located in Changsha City, Hunan Province, China. The region is situated in a subtropical monsoon climate, characterized by warm winters, hot summers, abundant rainfall primarily concentrated in the summer months, and distinct four seasons with relatively balanced seasonal distribution. In Changsha, the seasonal pattern features longer summers and winters, while spring and autumn are relatively shorter. And the average annual temperature is 17.2&#xb0;C, the accumulated annual temperature is approximately 5,457&#xb0;C, and the average yearly precipitation is 1361.6&#xa0;mm. The crop rotation scheme involved black loam soil with rice as the preceding crop. Planting occurred in September 2020, with harvesting in April 2021.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Location of the study area and hyperspectral collection environment. <bold>(A)</bold> Study area location in Changsha City, China; <bold>(B)</bold> Satellite map of Yunyuan Experimental Base (highlighted in red); <bold>(C)</bold> Hyperspectral data acquisition setup; <bold>(D)</bold> Region of Interest (ROI) for rapeseed sample.</p>
</caption>
<graphic xlink:href="fgene-15-1518205-g001.tif"/>
</fig>
<p>
<bold>Remark 1:</bold> This study represents a preliminary exploration into color classification of rapeseed seeds through integrating hyperspectral technology and machine learning methods. Recognizing the attributes of yellow-seeded varieties-such as high oil content, elevated polyphenol levels, enhanced nutritional value, and precise harvest time determination-we aim to employ the proposed model for identifying yellow-seeded rapeseed. Accordingly, we focus on the established varieties Xiangyou 708 and Xiangyou 710, which have been widely cultivated and promoted in Hunan Province, China.</p>
</sec>
<sec id="s2-2">
<title>2.2 Data collection</title>
<p>We utilized the SOC710 portable hyperspectral imager (wavelength range: 380&#x2013;1,091&#xa0;nm; resolution: 4.9458&#xa0;nm) along with its darkroom system, manufactured by Surface Optics Corporation, United States, to collect spectral data. The optical obscura, as shown in <xref ref-type="fig" rid="F1">Figure 1C</xref>, was maintained in dark conditions. Measuring <inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:mn>50</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>60</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>120</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> <inline-formula id="inf2">
<mml:math id="m2">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mtext>cm</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, the obscura featured a movable base, a cooling device, and diffusely reflective coating inside. Equipped with a large and small task silo, a lifting table, and four groups of 70W halogen light sources adjustable in position, the spectrometer was mounted at the top small silo with a vertical lens at a distance of 370&#xa0;mm from the rapeseed samples. A total of 300 rapeseed samples were selected (see <xref ref-type="fig" rid="F1">Figure 1D</xref>), and each seed&#x2019;s spectral reflectance was measured five times randomly, with the average taken as the sample reflectance. Additionally, the RGB color information of each sample was recorded.</p>
</sec>
<sec id="s2-3">
<title>2.3 Methods and indicators</title>
<p>Feature selection and modeling method are the key components of our seed identification model. First, the spectral index is commonly used as a reliable indicator in crop remote sensing for seed quality assessment. It enhances crop spectral information while effectively reducing noise and environmental interference by combining two or more spectral reflectances. Spectral indices provide rich data on rapeseed (<xref ref-type="bibr" rid="B39">Zhang et al., 2017</xref>; <xref ref-type="bibr" rid="B12">Hong et al., 2019</xref>; <xref ref-type="bibr" rid="B3">Bai et al., 2022</xref>). In this study, we employ three indices-ratio spectral index (RSI), difference spectral index (DSI), and normalized spectral index (NDSI), calculated for wavelengths 400&#x2013;1,000&#xa0;nm:<disp-formula id="e1">
<mml:math id="m3">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>RSI</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>
<disp-formula id="e2">
<mml:math id="m4">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>DSI</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>and<disp-formula id="e3">
<mml:math id="m5">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>NDSI</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
<label>(3)</label>
</disp-formula>
</p>
<p>We also consider trilateral parameters-covering blue (490&#x2013;530&#xa0;nm), yellow (560&#x2013;640&#xa0;nm), and red (680&#x2013;760&#xa0;nm) edges-as additional hyperspectral features containing vital rapeseed information. Our study includes 23 representative parameters (see <xref ref-type="table" rid="T1">Table 1</xref>) encompassing characteristics such as location, amplitude, area, normalization, ratios, and numerical attributes (<xref ref-type="bibr" rid="B26">Peng et al., 2020</xref>; <xref ref-type="bibr" rid="B32">Sibanda et al., 2019</xref>).</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Hyperspectral trilateral characteristic parameter calculation formulas.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Name</th>
<th align="left">Description or calculation</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Db</td>
<td align="left">Spectral maximum value of first derivative in blue edge (490&#x2013;530&#xa0;nm)</td>
</tr>
<tr>
<td align="left">BDb</td>
<td align="left">Bands corresponding to maximum first derivative value in blue edge</td>
</tr>
<tr>
<td align="left">SDb</td>
<td align="left">Square of blue edge: integration of first derivative over blue edge range</td>
</tr>
<tr>
<td align="left">Dbmin</td>
<td align="left">Minimum first derivative value in blue edge</td>
</tr>
<tr>
<td align="left">NDb</td>
<td align="left">Normalized blue-edge index, (Db-Dbmin)/(Db &#x2b; Dbmin)</td>
</tr>
<tr>
<td align="left">Dy</td>
<td align="left">Spectral maximum value of first derivative in yellow edge (560&#x2013;640&#xa0;nm)</td>
</tr>
<tr>
<td align="left">BDy</td>
<td align="left">Bands corresponding to maximum first derivative value in yellow edge</td>
</tr>
<tr>
<td align="left">SDy</td>
<td align="left">Square of yellow edge: integration of first derivative over yellow edge range</td>
</tr>
<tr>
<td align="left">Dymin</td>
<td align="left">Minimum first derivative value in yellow edge</td>
</tr>
<tr>
<td align="left">NDy</td>
<td align="left">Normalized yellow-edge index, (Dy-Dymin)/(Dy &#x2b; Dymin)</td>
</tr>
<tr>
<td align="left">Dr</td>
<td align="left">Spectral maximum value of first derivative in red edge (680&#x2013;760&#xa0;nm)</td>
</tr>
<tr>
<td align="left">BDr</td>
<td align="left">Bands corresponding to maximum first derivative value in red edge</td>
</tr>
<tr>
<td align="left">SDr</td>
<td align="left">Square of red edge: integration of first derivative over red edge range</td>
</tr>
<tr>
<td align="left">Drmin</td>
<td align="left">Minimum first derivative value in red edge</td>
</tr>
<tr>
<td align="left">NDr</td>
<td align="left">Normalized red-edge index, (Dr-Drmin)/(Dr &#x2b; Drmin)</td>
</tr>
<tr>
<td align="left">Srb</td>
<td align="left">SDr/SDb</td>
</tr>
<tr>
<td align="left">Sry</td>
<td align="left">SDr/SDy</td>
</tr>
<tr>
<td align="left">Syb</td>
<td align="left">SDy/SDb</td>
</tr>
<tr>
<td align="left">NBDb</td>
<td align="left">(SDr-SDb)/(SDr &#x2b; SDb)</td>
</tr>
<tr>
<td align="left">Nry</td>
<td align="left">(SDr-SDy)/(SDr &#x2b; SDy)</td>
</tr>
<tr>
<td align="left">Nby</td>
<td align="left">(SDb-SDy)/(SDb &#x2b; SDy)</td>
</tr>
<tr>
<td align="left">Kur</td>
<td align="left">Kurtosis of red-edge first derivative curve</td>
</tr>
<tr>
<td align="left">Ske</td>
<td align="left">Skewness of red-edge first derivative curve</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>These spectral indicators provide crucial information for characterizing seed color and are thus used in feature combinations for modeling.</p>
<p>To enable effective yellow-seeded rapeseed identification, we employ two well-established mathematical models. First, partial least squares regression (PLSR) (<xref ref-type="bibr" rid="B24">Meacham-Hensold et al., 2019</xref>) combines advantages of multiple linear regression, principal component analysis, and conventional correlation analysis and is commonly applied in spectral research. PLSR creates a linear regression model by projecting independent and response variables into a new space. Here, we use PLSR to predict the values of the three color channels [red (R), green (G), and blue (B)] for differentiating yellow-seeded from non-yellow-seeded rapeseeds.</p>
<p>Additionally, since generalized linear regression is suited for dichotomous classification, we apply logistic regression (Logit-R) to distinguish yellow from non-yellow-seeded rapeseed. The Logit-R model, a widely used machine learning technique, derives prediction parameters from training data and uses these to calculate a data segmentation hyperplane for classification (<xref ref-type="bibr" rid="B5">Broeckx et al., 2018</xref>; <xref ref-type="bibr" rid="B20">Lin et al., 2014</xref>; <xref ref-type="bibr" rid="B25">Munshi et al., 2014</xref>).</p>
</sec>
</sec>
<sec sec-type="results|discussion" id="s3">
<title>3 Results and discussion</title>
<sec id="s3-1">
<title>3.1 Model preparation</title>
<sec id="s3-1-1">
<title>3.1.1 Labeling of yellow-seeded rapeseed samples</title>
<p>To classify the yellow and non-yellow rapeseed samples, we first labeled the 300 seed samples as yellow or non-yellow. This classification was based on internationally recognized guidelines using R, G, and B color channel thresholds (<xref ref-type="bibr" rid="B42">Zhang et al., 2006</xref>; <xref ref-type="bibr" rid="B2">Baetzel et al., 2003</xref>; <xref ref-type="bibr" rid="B34">Ta&#x144;ska et al., 2005</xref>), defined as follows:<disp-formula id="e4">
<mml:math id="m6">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfenced open="{" close="">
<mml:mrow>
<mml:mtable class="cases">
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mn>0</mml:mn>
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mi>R</mml:mi>
<mml:mo>&#x2209;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mn>1</mml:mn>
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mi>R</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mfenced open="{" close="}">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="false">&#x7c;</mml:mo>
<mml:mn>164.1</mml:mn>
<mml:mo>&#x3c;</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo>&#x3c;</mml:mo>
<mml:mn>245.3</mml:mn>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
<label>(4)</label>
</disp-formula>
<disp-formula id="e5">
<mml:math id="m7">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>G</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfenced open="{" close="">
<mml:mrow>
<mml:mtable class="cases">
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mn>0</mml:mn>
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mi>G</mml:mi>
<mml:mo>&#x2209;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>G</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mn>1</mml:mn>
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mi>G</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mfenced open="{" close="}">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>G</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="false">&#x7c;</mml:mo>
<mml:mn>101.1</mml:mn>
<mml:mo>&#x3c;</mml:mo>
<mml:mi>G</mml:mi>
<mml:mo>&#x3c;</mml:mo>
<mml:mn>226.2</mml:mn>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
<label>(5)</label>
</disp-formula>
<disp-formula id="e6">
<mml:math id="m8">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>B</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfenced open="{" close="">
<mml:mrow>
<mml:mtable class="cases">
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mn>0</mml:mn>
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mi>B</mml:mi>
<mml:mo>&#x2209;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>B</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mn>1</mml:mn>
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mi>B</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:mfenced open="{" close="}">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>B</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="false">&#x7c;</mml:mo>
<mml:mn>9.1</mml:mn>
<mml:mo>&#x3c;</mml:mo>
<mml:mi>B</mml:mi>
<mml:mo>&#x3c;</mml:mo>
<mml:mn>92.2</mml:mn>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
<label>(6)</label>
</disp-formula>and<disp-formula id="e7">
<mml:math id="m9">
<mml:mrow>
<mml:mi>Y</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>Y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2229;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>Y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>G</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2229;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>Y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>B</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfenced open="{" close="">
<mml:mrow>
<mml:mtable class="cases">
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:mtext>otherwise</mml:mtext>
<mml:mspace width="1em"/>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mi>G</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>G</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mi>B</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>B</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>.</mml:mo>
<mml:mspace width="1em"/>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
<label>(7)</label>
</disp-formula>Here, <inline-formula id="inf3">
<mml:math id="m10">
<mml:mrow>
<mml:mi>Y</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> signifies yellow-seeded, while <inline-formula id="inf4">
<mml:math id="m11">
<mml:mrow>
<mml:mi>Y</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> denotes non-yellow-seeded. This labeling process resulted in 103 yellow-seeded and 197 non-yellow-seeded samples. <xref ref-type="table" rid="T2">Table 2</xref> summarizes the RGB statistics for the 300 samples.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Statistical characteristics of R/G/B values.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="center"/>
<th rowspan="2" align="center">Number of Samples</th>
<th colspan="2" align="center">Red value</th>
<th colspan="2" align="center">Green value</th>
<th colspan="2" align="center">Blue value</th>
</tr>
<tr>
<th align="center">Mean</th>
<th align="center">Std.</th>
<th align="center">Mean</th>
<th align="center">Std.</th>
<th align="center">Mean</th>
<th align="center">Std.</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">Yellow</td>
<td align="center">103</td>
<td align="center">202.786</td>
<td align="center">16.737</td>
<td align="center">135.796</td>
<td align="center">17.443</td>
<td align="center">63.747</td>
<td align="center">6.065</td>
</tr>
<tr>
<td align="center">Non-yellow</td>
<td align="center">197</td>
<td align="center">118.426</td>
<td align="center">31.735</td>
<td align="center">79.061</td>
<td align="center">9.63</td>
<td align="center">63.035</td>
<td align="center">6.673</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-1-2">
<title>3.1.2 Spectral index feature extraction</title>
<p>The spectral indices in <xref ref-type="disp-formula" rid="e1">Equations 1</xref>&#x2013;<xref ref-type="disp-formula" rid="e3">3</xref> capture various aspects of hyperspectral information. Selecting optimal band combinations is critical to obtaining the three spectral indices that best represent the red, green, and blue color information. A correlation analysis was conducted between the spectral indices and RGB values, with half of the samples used to distinguish between training and test sets, with 100 independent repetitions to minimize random noise effects. The highest average correlation coefficients for each spectral index, along with corresponding band combinations, are shown in <xref ref-type="table" rid="T3">Table 3</xref>. <xref ref-type="fig" rid="F2">Figure 2</xref> illustrates one of the implementations.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Most correlated bands for spectral index.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="center">Spectral Index</th>
<th colspan="2" align="center">Red value</th>
<th colspan="2" align="center">Green value</th>
<th colspan="2" align="center">Blue value</th>
</tr>
<tr>
<th align="center">
<inline-formula id="inf5">
<mml:math id="m12">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th align="center">CC</th>
<th align="center">
<inline-formula id="inf6">
<mml:math id="m13">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th align="center">CC</th>
<th align="center">
<inline-formula id="inf7">
<mml:math id="m14">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</th>
<th align="center">CC</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">RSI</td>
<td align="center">(705, 910)</td>
<td align="center">
<inline-formula id="inf8">
<mml:math id="m15">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mn>0.9673</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">(582, 983)</td>
<td align="center">
<inline-formula id="inf9">
<mml:math id="m16">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mn>0.9278</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">(534, 571)</td>
<td align="center">
<inline-formula id="inf10">
<mml:math id="m17">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mn>0.4449</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="center">DSI</td>
<td align="center">(418, 610)</td>
<td align="center">
<inline-formula id="inf11">
<mml:math id="m18">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mn>0.9165</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">(421, 536)</td>
<td align="center">-<inline-formula id="inf12">
<mml:math id="m19">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mn>0.9440</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">(419, 994)</td>
<td align="center">-<inline-formula id="inf13">
<mml:math id="m20">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mn>0.4068</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="center">NDSI</td>
<td align="center">(646, 995)</td>
<td align="center">
<inline-formula id="inf14">
<mml:math id="m21">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mn>0.9660</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">(568, 988)</td>
<td align="center">
<inline-formula id="inf15">
<mml:math id="m22">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mn>0.9380</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">(531, 571)</td>
<td align="center">
<inline-formula id="inf16">
<mml:math id="m23">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mn>0.4563</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>&#x2a;&#x2a;significance at 0.01 level.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Correlation analysis between spectral indices and RGB values. Each heatmap highlights the highest correlation coefficient with an arrow. The top panels (label 1), middle panels (label 2) and bottom panels (label 3) denote R-value; 2 G-value; 3 B-value, respectively. <bold>(A)</bold> RSI; <bold>(B)</bold> DSI; <bold>(C)</bold> NDSI.</p>
</caption>
<graphic xlink:href="fgene-15-1518205-g002.tif"/>
</fig>
</sec>
<sec id="s3-1-3">
<title>3.1.3 Trilateral parameter feature extraction</title>
<p>We also performed a correlation analysis between trilateral parameters and RGB color channels. A random selection of 150 samples with 100 repetitions was used. <xref ref-type="fig" rid="F3">Figure 3</xref> displays the absolute average correlation coefficients of the 23 trilateral parameters with red, green, and blue channels. For the red channel, the top three parameters are Nrb, Srb, and SDb, which are identical to those for the green channel. For the blue channel, the top three are Sry, Nry, and Dr, with lower correlation coefficients than the red and green channels but significant at the 0.01 level.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Absolute correlation coefficients between trilateral parameters and color channels. <bold>(A)</bold> Red channel, <bold>(B)</bold> Green channel, <bold>(C)</bold> Blue channel. Error bars represent standard deviations from 100 repetitions. &#x2a; and &#x2a;&#x2a; denote significance at the 0.05 and 0.01 levels, respectively.</p>
</caption>
<graphic xlink:href="fgene-15-1518205-g003.tif"/>
</fig>
<p>Based on the above correlation analysis, we identified optimal feature parameters for each channel. We subsequently combined the three spectral indices with the top three trilateral parameters to create feature sets for predicting the RGB values of test samples.</p>
</sec>
</sec>
<sec id="s3-2">
<title>3.2 Modeling of rapeseed yellow-seeded identification</title>
<p>In this subsection, we establish four yellow-seed identification models by using PLSR, Logistic regression (Logit-R), and two machine learning methods, i.e., support vector classifier (SVC) and random forest. In each model, the 300 samples are randomly divided into two groups, namely, <inline-formula id="inf17">
<mml:math id="m24">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> training samples and <inline-formula id="inf18">
<mml:math id="m25">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>300</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>M</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> test samples, where <inline-formula id="inf19">
<mml:math id="m26">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> varies from 150 to 240 with step size 10. We train the models by the samples in the training set and test the model on the test set. In practice, we first input the feature combination of three spectral indexes and top-three trilateral parameters of the <inline-formula id="inf20">
<mml:math id="m27">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> training samples and the corresponding labeled yellow or non-yellow seeded (values of R/G/B or <italic>Y</italic>) to train the modes. Then, the feature combination of the <inline-formula id="inf21">
<mml:math id="m28">
<mml:mrow>
<mml:mn>300</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> test samples is input into the trained model to predict the result. In the end, the recognition accuracy (RA) is calculated according to the predicted results and the labeled results. To eliminate the interference of random noise, the above process is repeated 100 times to acquire the average RA.</p>
<sec id="s3-2-1">
<title>3.2.1 Predication modeling based on PLSR</title>
<p>According to the corn idea of PLSR, the arguments can be input into the model directly regardless of whether multi-collinearity or not. Therefore, we use the six parameters (the three spectral indexes and the top three trilateral parameters) of training samples and the corresponding R/G/B values to train the PLSR model first (constructing regression model to estimate the values of red, green, and blue, denoted by <inline-formula id="inf22">
<mml:math id="m29">
<mml:mrow>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>G</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula id="inf23">
<mml:math id="m30">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>B</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula>, respectively). Taking the <inline-formula id="inf24">
<mml:math id="m31">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>150</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> (it means there are randomly chosen 150 training samples and 150 test samples) as an example, the regression estimation is,<disp-formula id="e8">
<mml:math id="m32">
<mml:mrow>
<mml:mfenced open="{" close="">
<mml:mrow>
<mml:mtable class="cases">
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mn>192.76</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>6.64</mml:mn>
<mml:mtext>SDb</mml:mtext>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>29.05</mml:mn>
<mml:mtext>Srb</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>10.63</mml:mn>
<mml:mtext>Nrb</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>75.79</mml:mn>
<mml:msub>
<mml:mrow>
<mml:mtext>RSI</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>705,910</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mo>&#x2b;</mml:mo>
<mml:mn>126.53</mml:mn>
<mml:msub>
<mml:mrow>
<mml:mtext>DSI</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>418,610</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>130.96</mml:mn>
<mml:msub>
<mml:mrow>
<mml:mtext>NDSI</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>646,995</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>G</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mn>171.39</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>33.79</mml:mn>
<mml:mtext>SDb</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>13.69</mml:mn>
<mml:mtext>Srb</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>23.13</mml:mn>
<mml:mtext>Nrb</mml:mtext>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>90.19</mml:mn>
<mml:msub>
<mml:mrow>
<mml:mtext>RSI</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>583,983</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mo>&#x2b;</mml:mo>
<mml:mn>104.84</mml:mn>
<mml:msub>
<mml:mrow>
<mml:mtext>DSI</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>421,536</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>148.18</mml:mn>
<mml:msub>
<mml:mrow>
<mml:mtext>NDSI</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>568,988</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>B</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mn>45.53</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.69</mml:mn>
<mml:mtext>SDb</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.41</mml:mn>
<mml:mtext>Srb</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.09</mml:mn>
<mml:mtext>Nrb</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>4.65</mml:mn>
<mml:msub>
<mml:mrow>
<mml:mtext>RSI</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>534,571</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mo>&#x2212;</mml:mo>
<mml:mn>11.79</mml:mn>
<mml:msub>
<mml:mrow>
<mml:mtext>DSI</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>419,994</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>7.04</mml:mn>
<mml:msub>
<mml:mrow>
<mml:mtext>NDSI</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>531,571</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msub>
<mml:mo>.</mml:mo>
<mml:mspace width="0.3333em"/>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
<label>(8)</label>
</disp-formula>
</p>
<p>
<bold>Remark 2.</bold> Here, we approached false positives and false negatives with equal consideration. It is indeed accurate to acknowledge that lower error rates can also bring significant losses due to distinct economic implications associated with false negatives and false positives. Moving forward, we plan to enhance our color identification model by incorporating the economic impact of oil content.</p>
<p>Next, the same arguments of the 150 test samples are input into <xref ref-type="disp-formula" rid="e8">Equation 8</xref> to inverse the R, G, and B values respectively. The predicted values and the labeled results are shown in <xref ref-type="fig" rid="F4">Figure 4</xref>. The blue values locate a relatively narrow range compared to the red and green values, but they are all around the theoretical line of <inline-formula id="inf25">
<mml:math id="m33">
<mml:mrow>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>Y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>Y</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Comparison of predicted value and observed value of R, G, and B. The black solid line denotes the theoretical <inline-formula id="inf26">
<mml:math id="m34">
<mml:mrow>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>Y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>Y</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
</caption>
<graphic xlink:href="fgene-15-1518205-g004.tif"/>
</fig>
<p>Then, using the predicted values of R/G/B, the test samples can be classified into yellow-seeded and non-yellow-seeded according to <xref ref-type="disp-formula" rid="e4">Equations 4</xref>&#x2013;<xref ref-type="disp-formula" rid="e7">7</xref>. <xref ref-type="table" rid="T4">Table 4</xref> shows the confusion matrix for two different numbers of training samples, <inline-formula id="inf27">
<mml:math id="m35">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>150</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> (150 test samples) and <inline-formula id="inf28">
<mml:math id="m36">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>240</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> (60 test samples), respectively. The small number of misclassified samples is satisfactory.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>The identification results on the test set based on PLSR.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">150 samples</th>
<th align="center">Yellow</th>
<th align="center">Non-yellow</th>
<th align="center">60 samples</th>
<th align="center">Yellow</th>
<th align="center">Non-yellow</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">Yellow</td>
<td align="center">45</td>
<td align="center">6</td>
<td align="center">Yellow</td>
<td align="center">21</td>
<td align="center">1</td>
</tr>
<tr>
<td align="center">Non-yellow</td>
<td align="center">4</td>
<td align="center">95</td>
<td align="center">Non-yellow</td>
<td align="center">1</td>
<td align="center">37</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Varying <inline-formula id="inf29">
<mml:math id="m37">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> from 150 to 240, the RA of yellow-seeded, non-yellow-seeded, and mixed are calculated on the test set. As seen from <xref ref-type="fig" rid="F5">Figure 5</xref>, the RA of the non-yellow-seeded is higher than that of the yellow-seeded. Naturally, the average RA tends to increase with the increase of training samples, however, it is located in the narrow interval of (92.32%, and 96.55%), which confirms the PLSR-based model with fusion feature of spectral index and trilateral parameters is workable.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Recognition accuracy based on the PLSR model.</p>
</caption>
<graphic xlink:href="fgene-15-1518205-g005.tif"/>
</fig>
</sec>
<sec id="s3-2-2">
<title>3.2.2 Recognition modeling based on Logit-R</title>
<p>Similar to the PLSR model, we first use the fusion feature and the corresponding labeled seed attribute of training samples to train the Logit-R model. Then, the fusion feature of the test samples is input into the trained model to predict the discriminant probability and further calculate the classification accuracy. What&#x2019;s different from the PLSR model is the label of seed attribute is a Boolean variable of <inline-formula id="inf30">
<mml:math id="m38">
<mml:mrow>
<mml:mi>Y</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> (denotes yellow-seeded) and <inline-formula id="inf31">
<mml:math id="m39">
<mml:mrow>
<mml:mi>Y</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> (denotes non-yellow-seeded). To compare the model performance brought by the spectral index and trilateral parameters, the two kinds of features are input into the model respectively. To do so, the three spectral indexes and top-three trilateral parameters related to the highest correlation coefficient for the R/G/B channels are used as feature combinations, respectively to calculate the RA, as shown in <xref ref-type="fig" rid="F6">Figure 6</xref>. In the Logit-R model, the regular coefficient is set at 0.2, the maximum iterations are set at 300, the learning rate is set at 0.01, and the threshold is set at 0.5. As seen in <xref ref-type="fig" rid="F6">Figure 6</xref>, the RA obtained from the spectral index fusion for the green channel and the trilateral parameters for the blue channel is comparatively low. However, using the fusion feature of the three spectral indexes based on the red channel can reach as high as 98% RA, which is higher than other fusion features significantly, even higher than the result from the six-feature fusion based on the PLSR model. In addition, the high RA is regardless of the number of training samples. In this regard, the three-spectral index fusion for the red channel based on Logit-R is suggested to identify the rapeseed yellow seeded.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>The recognition accuracy brought from R, G, and B channels based on different fusion features. <bold>(A)</bold> is spectral index combination and <bold>(B)</bold> is trilateral parameters combination.</p>
</caption>
<graphic xlink:href="fgene-15-1518205-g006.tif"/>
</fig>
<p>Following, let&#x2019;s show how the Logit-R model using three-spectral indexes combination <inline-formula id="inf32">
<mml:math id="m40">
<mml:mrow>
<mml:mo stretchy="false">{</mml:mo>
<mml:mrow>
<mml:mtext>RSI</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>705,910</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mtext>DSI</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>418,610</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mtext>NDSI</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>646,995</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">}</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> for classifying the yellow and non-yellow seeded. Taking <inline-formula id="inf33">
<mml:math id="m41">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>150</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> as an example. Before that, we placed the randomly selected 150 test samples in the three-dimensional space constructed by the above spectral indexes, as shown in <xref ref-type="fig" rid="F7">Figure 7</xref>. The yellow-seeded and non-yellow-seeded are clustered together visually, respectively and separated from each other.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Two-classification of the yellow and non-yellow-seeded samples based on the feature combination <inline-formula id="inf34">
<mml:math id="m42">
<mml:mrow>
<mml:mo stretchy="false">{</mml:mo>
<mml:mrow>
<mml:mtext>RSI</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>705,910</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mtext>DSI</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>418,610</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mtext>NDSI</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>646,995</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">}</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
</caption>
<graphic xlink:href="fgene-15-1518205-g007.tif"/>
</fig>
<p>Now, we hope to find a segmentation hyperplane to separate the above two types of samples. To do so, firstly, we input the remaining 150 samples including the spectral index combination and the corresponding labeled Y &#x3d; 0/1 to train the Logit-R model. The trained discriminant function is<disp-formula id="equ1">
<mml:math id="m43">
<mml:mrow>
<mml:mi>h</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>exp</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>3.3589</mml:mn>
<mml:mtext>RSI</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>4.3883</mml:mn>
<mml:mtext>DSI</mml:mtext>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>5.1165</mml:mn>
<mml:mtext>NDSI</mml:mtext>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfrac>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
</p>
<p>Then, inputting the three-spectral indexes combination of the 150 remaining samples into the trained model. <xref ref-type="fig" rid="F7">Figure 7</xref> depicts the sample distribution of four categories: yellow-seeded (yellow dots), non-yellow-seeded (grey squares), misclassified yellow-seeded samples (red dots), and misclassified non-yellow-seeded (red squares). As seen in <xref ref-type="fig" rid="F8">Figure 8</xref>, there are only one yellow sample is misclassified and 9 non-yellow samples are misclassified. The RA of yellow-seeded and non-yellow-seeded is 97.78% and 91.43%, respectively, and the average RA is 93.33%.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>The classification of the yellow and non-yellow-seeded samples based on the feature combination <inline-formula id="inf35">
<mml:math id="m44">
<mml:mrow>
<mml:mo stretchy="false">{</mml:mo>
<mml:mrow>
<mml:mtext>RSI</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>705,910</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mtext>DSI</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>418,610</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mtext>NDSI</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>646,995</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">}</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
</caption>
<graphic xlink:href="fgene-15-1518205-g008.tif"/>
</fig>
</sec>
<sec id="s3-2-3">
<title>3.2.3 Predication results with machine learning methods</title>
<p>In this section, we employ two machine learning techniques: random forest <xref ref-type="bibr" rid="B4">Breiman (2001)</xref> and support vector classifier (SVC) <xref ref-type="bibr" rid="B28">Pisner and Schnyer (2020)</xref> to perform a classification task aimed at identifying the yellow seed. Differing from the preceding feature selection methods, we enhance our feature pool by integrating the original hyperspectral reflectances, consisting of nine spectral indexes calculated according to <xref ref-type="table" rid="T3">Table 3</xref>, and 23 trilateral parameters. This augmentation results in a total of 633 features.</p>
<p>To extract pivotal attributes and eliminate redundant data, we employ lasso-penalized logistic regression with the R package &#x2018;glmnet&#x2019; (<xref ref-type="bibr" rid="B9">Friedman et al., 2010</xref>). The parameter <inline-formula id="inf36">
<mml:math id="m45">
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, which balances the penalty and loss terms, is fine-tuned to maximize the &#x201c;auc&#x201d; index. Upon tuning, <inline-formula id="inf37">
<mml:math id="m46">
<mml:mrow>
<mml:mi>&#x3bb;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is set at 0.0062. Consequently, we identified 10 key features out of the initial 633. These features include the original hyperspectral values at wavelengths 394, 415, 416, 417, and 418, <inline-formula id="inf38">
<mml:math id="m47">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>NDSI</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>568,988</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> (a spectral index), as well as Yep, Dymin, SDr, and ske (trilateral parameters).</p>
<p>According to these selected ten features, we conduct random forest and support vector classifier algorithms via R packages &#x2018;rpart&#x2019; (<xref ref-type="bibr" rid="B35">Therneau et al., 2015</xref>) and &#x2018;e1071&#x2019; (<xref ref-type="bibr" rid="B8">Meyer et al., 2024</xref>), respectively, by default settings with different training sizes (M: 150&#x2013;240). The prediction results in test sets for the recognition task are reported in <xref ref-type="table" rid="T5">Table 5</xref>.</p>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Results of recognition accuracies with machine learning methods.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="center">Training size M</th>
<th colspan="3" align="center">Random forest</th>
<th colspan="3" align="center">Support vector classifier</th>
</tr>
<tr>
<th align="center">Average</th>
<th align="center">Non-yellow</th>
<th align="center">Yellow</th>
<th align="center">Average</th>
<th align="center">Non-yellow</th>
<th align="center">Yellow</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">150</td>
<td align="center">96.52%</td>
<td align="center">98.31%</td>
<td align="center">93.25%</td>
<td align="center">97.99%</td>
<td align="center">99.25%</td>
<td align="center">95.68%</td>
</tr>
<tr>
<td align="center">160</td>
<td align="center">96.56%</td>
<td align="center">98.23%</td>
<td align="center">93.52%</td>
<td align="center">97.87%</td>
<td align="center">99.18%</td>
<td align="center">95.50%</td>
</tr>
<tr>
<td align="center">170</td>
<td align="center">96.65%</td>
<td align="center">98.42%</td>
<td align="center">93.49%</td>
<td align="center">97.98%</td>
<td align="center">99.26%</td>
<td align="center">95.70%</td>
</tr>
<tr>
<td align="center">180</td>
<td align="center">96.60%</td>
<td align="center">98.34%</td>
<td align="center">93.49%</td>
<td align="center">98.07%</td>
<td align="center">99.32%</td>
<td align="center">95.81%</td>
</tr>
<tr>
<td align="center">190</td>
<td align="center">96.63%</td>
<td align="center">98.38%</td>
<td align="center">93.53%</td>
<td align="center">97.98%</td>
<td align="center">99.20%</td>
<td align="center">95.83%</td>
</tr>
<tr>
<td align="center">200</td>
<td align="center">96.70%</td>
<td align="center">98.55%</td>
<td align="center">93.51%</td>
<td align="center">98.00%</td>
<td align="center">99.14%</td>
<td align="center">96.03%</td>
</tr>
<tr>
<td align="center">210</td>
<td align="center">96.77%</td>
<td align="center">98.42%</td>
<td align="center">93.91%</td>
<td align="center">97.99%</td>
<td align="center">99.02%</td>
<td align="center">96.21%</td>
</tr>
<tr>
<td align="center">220</td>
<td align="center">96.70%</td>
<td align="center">98.35%</td>
<td align="center">93.90%</td>
<td align="center">97.94%</td>
<td align="center">98.94%</td>
<td align="center">96.23%</td>
</tr>
<tr>
<td align="center">230</td>
<td align="center">96.75%</td>
<td align="center">98.34%</td>
<td align="center">94.15%</td>
<td align="center">98.03%</td>
<td align="center">99.07%</td>
<td align="center">96.33%</td>
</tr>
<tr>
<td align="center">240</td>
<td align="center">96.92%</td>
<td align="center">98.57%</td>
<td align="center">94.26%</td>
<td align="center">98.08%</td>
<td align="center">99.00%</td>
<td align="center">96.61%</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>In comparing the recognition accuracies achieved by random forest and SVC methods, several key observations emerge. Regarding average accuracy, random forest demonstrates results ranging from approximately 96.52%&#x2013;96.92%, while SVC exhibits a slightly higher range of around 97.87%&#x2013;98.08%. Both methods exhibit an increase in accuracy with larger training sizes, with random forest&#x2019;s accuracy gradually ascending and SVC&#x2019;s accuracy following a similar trend, albeit with minor fluctuations.</p>
<p>In terms of category-specific accuracies, random forest achieves accuracy rates between approximately 93.25% and 94.26% in the yellow category, whereas SVC yields higher accuracy within the range of 95.68%&#x2013;96.61%. For the non-yellow category, random forest consistently attains commendable accuracy, hovering between roughly 98.23% and 98.57%, whereas SVC shows even greater accuracy, ranging from approximately 98.94%&#x2013;99.32%, generally surpassing random forest.</p>
<p>The consistency of performance across training sizes and categories is notable in the random forest&#x2019;s case, where stability is observed. On the other hand, SVC displays slight performance variations, particularly noticeable within the yellow category. In the broader context of comparison, SVC emerges as the more favorable option, showcasing superior performance across most categories and training sizes. While random forest performs admirably in the non-yellow category, it falls short of SVC&#x2019;s accuracy levels in the yellow category. This analysis underscores the nuanced strengths of each method and the importance of considering the specific problem context when selecting an appropriate machine learning approach.</p>
</sec>
</sec>
<sec id="s3-3">
<title>3.3 Discussion of the proposed recognition methods</title>
<p>Up to this point, the task of recognizing yellow-seeded varieties has been effectively accomplished through the application of hyperspectral technology. Now, we would like to delve into the details of the four proposed models.</p>
<p>Beginning with the PLSR-based model, our approach involves identifying yellow-seeded varieties by predicting the RGB values through three essential trilateral parameters obtained from hyperspectral imaging of rapeseed, along with three significant spectral indices. During the process of predicting each R/G/B channel, we extract several noteworthy spectral features that contribute to enhancing the model&#x2019;s interpretability. It&#x2019;s important to note that the success of this method relies heavily on the accuracy of RGB calibration. Moving on to the Logit-R model, our strategy revolves around determining yellow-seeded or non-yellow-seeded categorization based on generating probabilities. However, one potential challenge of this model lies in dealing with imbalanced sample data. To address this, when data imbalance is encountered, it&#x2019;s essential to consider adjusting classification thresholds to ensure accurate results. The optimal hyperspectral feature chosen for both the aforementioned models is determined through a thorough correlation analysis between the R/G/B values and the 23 trilateral parameters and spectral indices derived from a complete band combination. It&#x2019;s worth mentioning that this approach might potentially omit some information from the original spectral reflectance data. Diverging from the two aforementioned methods, the machine learning models operate differently. In this case, we initially conduct feature dimensionality reduction from a total of 633 features, encompassing all 23 trilateral parameters, 9 spectral indices, and reflectance data from 601 original bands. Subsequently, we select ten key features to input into the random forest and SVC models.</p>
<p>All four models demonstrate high average accuracy rates, showcasing relatively similar performance differences ranging from 93% to 98%. This consistency highlights the feasibility of the framework that combines spectral features with intelligent models for accurately identifying yellow-seeded <italic>B. napus</italic> varieties. Considering factors like ease of operation and comprehensive utilization of information, the SVC model is recommended as an optimal choice for the task of identifying yellow-seeded varieties.</p>
</sec>
</sec>
<sec id="s4">
<title>4 Discussions and conclusion</title>
<p>Remote sensing technology, recognized as an essential national strategy, finds extensive application across both military and civilian domains. It facilitates the efficient acquisition of spectral data, enabling tasks like land classification and parameter inversion that are challenging for vision-based systems. Hyperspectral imaging technology, a near-Earth remote sensing tool, forms the basis for this advancement. As an innovative method of photoelectric detection and recognition, it integrates spectroscopy with optical imaging, offering a non-destructive and highly efficient alternative to traditional empirical and lab-based approaches for discerning the color of rapeseed seeds. Leveraging the rich spectral and image data inherent to rapeseed samples, this technology holds great promise for agricultural applications.</p>
<p>Comparing yellow seeds with black and brown seeds in Brassica napus reveals that yellow seeds have a thinner seed coat, higher oil content, and better quality. They also have higher protein content in the cake, lower cellulose and polyphenol levels, and higher economic value. Breeding yellow-seed varieties has become a key goal in rapeseed breeding worldwide. However, the complex seed color and inconsistent standards in current identification methods pose challenges. Most researchers use the naked eye or RGB color systems for seed color identification. However, the inconsistent phenotypic color and environmental influences make RGB methods unstable. In contrast, hyperspectral technology, which detects internal seed quality, is less affected by surface color, providing more stable results.</p>
<p>In this study, we introduce four intelligent models carefully designed to distinguish yellow-seeded rapeseed, as depicted in the model flowchart in <xref ref-type="fig" rid="F9">Figure 9</xref>. The first two models, PLSR and Logit-R, synergize spectral indices with hyperspectral trilateral parameters. This process begins with extracting three spectral indices and 23 trilateral parameters. Through correlation analyses across the R, G, and B color channels of rapeseed seeds, we determine the optimal combinations of these spectral indices and trilateral parameters.</p>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Flowchart of identification modeling.</p>
</caption>
<graphic xlink:href="fgene-15-1518205-g009.tif"/>
</fig>
<p>The PLSR model leverages six features derived from three spectral indices and three trilateral parameters, achieving an impressive recognition accuracy (RA) between 92.32% and 96.55% in differentiating yellow from non-yellow seeds. The Logit-R model, which prioritizes the three spectral indices combined with the R channel, achieves a remarkable RA of 98%.</p>
<p>Additionally, we employ two machine learning models-random forest and SVC-to tackle the identification task. Beyond the 23 trilateral parameters and nine optimal spectral indices, we include the original 601 spectral reflectance values in the feature set. Using lasso-penalized logistic regression, we identify ten key features, which serve as input for the random forest and SVC models, achieving an average RA of approximately 98%, with SVC slightly outperforming random forest.</p>
<p>We emphasize that the proposed identification framework for yellow-seeded rapeseed, which integrates classical statistical methods and advanced machine learning tools, demonstrates robust generalizability. This framework is not limited to rapeseed classification but holds significant potential for application to seed classification and identification tasks across a wide range of other crops. By combining hyperspectral feature extraction with predictive modeling techniques, it provides a versatile approach that can adapt to various seed types, accommodating their unique physical and spectral characteristics. This generalizability makes it a valuable tool for advancing precision agriculture and improving the efficiency of crop breeding programs. Additionally, the framework&#x2019;s ability to extract internal quality information and analyze large-scale data through machine learning models makes it adaptable for various agricultural tasks, including crop variety identification, stress detection, and quality assessment across different agricultural production systems. By customizing the spectral features and models for specific crops, this framework can be effectively extended to other agricultural systems, enhancing precision farming and crop management in diverse contexts.</p>
<p>This study identifies several limitations and proposes future research directions. It suggests integrating machine vision with machine learning for rapeseed color recognition as a cost-effective alternative to hyperspectral feature fusion, which remains expensive. Machine vision, efficient for non-destructive small-target color recognition, contrasts with hyperspectral remote sensing, which excels in large-area identification. A promising approach involves combining hyperspectral remote sensing with intelligent models, establishing a key paradigm for agricultural monitoring. Future work will focus on integrating machine vision and hyperspectral remote sensing to enhance rapeseed color recognition across broader areas.</p>
<p>Second, this study is limited by the small sample size and narrow color range, based on two <italic>B. napus</italic> varieties from a single field trial in Changsha (2020&#x2013;2021). As an initial exploration of hyperspectral technology and machine learning for yellow-seeded rapeseed identification, it provides valuable insights but requires expansion. Future research will include more rapeseed varieties and account for environmental factors like temperature, humidity, light, and altitude by incorporating multi-year, multi-location data for a comprehensive analysis of seed color variability.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec sec-type="author-contributions" id="s6">
<title>Author contributions</title>
<p>FL: Conceptualization, Formal Analysis, Methodology, Writing&#x2013;original draft. FW: Funding acquisition, Methodology, Supervision, Writing&#x2013;review and editing. ZZ: Validation, Writing&#x2013;review and editing. LC: Software, Visualization, Writing&#x2013;review and editing. JW: Formal Analysis, Software, Supervision, Writing&#x2013;review and editing. Y-GW: Formal Analysis, Software, Writing&#x2013;review and editing.</p>
</sec>
<sec sec-type="funding-information" id="s7">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. This research was supported partially by the National Natural Science Foundation of China (Grant No. 12471489), the Key Research Project of the Department of Education of Hunan Province (CN) (Grant No. 22A0135), the Excellent Young Research Project of the Department of Education of Hunan Province (CN) (Grant No. 24B1085), the &#x201c;Chunhui&#x201d; Program Collaborative Scientific Research Project (202202004), and the Australian Research Council project (DP160104292).</p>
</sec>
<ack>
<p>We would like to thank the Oil Institute of Hunan Agricultural University for providing two experimental rapeseed varieties of Xiangyou 708 and Xiangyou 710. The author wishes to thank the reviewers and the handling editor for their constructive comments and suggestions, which led to a great improvement in the presentation of this work.</p>
</ack>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="ai-statement" id="s9">
<title>Generative AI statement</title>
<p>The author(s) declare that no Generative AI was used in the creation of this manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="s10">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Auger</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Marnet</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Gautier</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Maia-Grondard</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Leprince</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Renard</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2010</year>). <article-title>A detailed survey of seed coat flavonoids in developing seeds of brassica napus l</article-title>. <source>J. Agric. Food Chem.</source> <volume>58</volume>, <fpage>6246</fpage>&#x2013;<lpage>6256</lpage>. <pub-id pub-id-type="doi">10.1021/jf903619v</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baetzel</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>L&#xfc;hs</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Badani</surname>
<given-names>A.-G.</given-names>
</name>
<name>
<surname>Friedt</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Development of segregating populations in the breeding of yellow-seeded winter rapeseed (brassica napus l.)</article-title>. <source>Proc. 11th Int. Rapeseed Congr.</source> <volume>1</volume>, <fpage>238</fpage>&#x2013;<lpage>242</lpage>.</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bai</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A back-propagation neural network model using hyperspectral imaging applied to variety nondestructive detection of cereal</article-title>. <source>J. Food Process Eng.</source> <volume>45</volume>, <fpage>e13973</fpage>. <pub-id pub-id-type="doi">10.1111/jfpe.13973</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Random forests</article-title>. <source>Mach. Learn.</source> <volume>45</volume>, <fpage>5</fpage>&#x2013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1023/a:1010933404324</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Broeckx</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Vanmaercke</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Duchateau</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Poesen</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>A data-based landslide susceptibility map of africa</article-title>. <source>Earth-Science Rev.</source> <volume>185</volume>, <fpage>102</fpage>&#x2013;<lpage>121</lpage>. <pub-id pub-id-type="doi">10.1016/j.earscirev.2018.05.002</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Rapid nondestructive detecting of sorghum varieties based on hyperspectral imaging and convolutional neural network</article-title>. <source>J. Sci. Food Agric.</source> <volume>103</volume>, <fpage>3970</fpage>&#x2013;<lpage>3983</lpage>. <pub-id pub-id-type="doi">10.1002/jsfa.12344</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Research progress in seed coat color of yellow-seeded rapeseed</article-title>. <source>J. Henan Agric. Sci.</source> <volume>44</volume>, <fpage>1</fpage>&#x2013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.15933/j.cnki.1004-3268.2015.09.001</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Friedman</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tibshirani</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Regularization paths for generalized linear models via coordinate descent</article-title>. <source>J. Stat. Softw.</source> <volume>33</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>22</lpage>. <pub-id pub-id-type="doi">10.18637/jss.v033.i01</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Rapid quantitative analysis of adulterated rice with partial least squares regression using hyperspectral imaging system</article-title>. <source>J. Sci. Food Agric.</source> <volume>99</volume>, <fpage>5558</fpage>&#x2013;<lpage>5564</lpage>. <pub-id pub-id-type="doi">10.1002/jsfa.9824</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>He</surname>
<given-names>S.-F.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Local wavelet packet decomposition of soil hyperspectral for som estimation</article-title>. <source>Infrared Phys. &#x26; Technol.</source> <volume>125</volume>, <fpage>104285</fpage>. <pub-id pub-id-type="doi">10.1016/j.infrared.2022.104285</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hong</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Application of fractional-order derivative in the quantitative estimation of soil organic matter content through visible and near-infrared spectroscopy</article-title>. <source>Geoderma</source> <volume>337</volume>, <fpage>758</fpage>&#x2013;<lpage>769</lpage>. <pub-id pub-id-type="doi">10.1016/j.geoderma.2018.10.025</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Local detrended fluctuation analysis for spectral red-edge parameters extraction</article-title>. <source>Nonlinear Dyn.</source> <volume>93</volume>, <fpage>995</fpage>&#x2013;<lpage>1008</lpage>. <pub-id pub-id-type="doi">10.1007/s11071-018-4241-y</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Extracting sensitive spectrum bands of rapeseed using multiscale multifractal detrended fluctuation analysis</article-title>. <source>J. Appl. Phys.</source> <volume>121</volume>. <pub-id pub-id-type="doi">10.1063/1.4978308</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>1992</year>). <article-title>Studies on the inheritance of yellow-seeded brassica napus l</article-title>. <source>Acta Agron. Sin. (China)</source>. <pub-id pub-id-type="doi">10.3321/j.issn:0496-3490.1992.04.001</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2001</year>). &#x201c;<article-title>Genetic study and commercial application of the yellow-seeded rapeseed (brassica napus l.)</article-title>,&#x201d; in <source>Proceedings of the international symposium on rapeseed science</source> (<publisher-loc>New York</publisher-loc>: <publisher-name>Science Press</publisher-name>), <fpage>19</fpage>&#x2013;<lpage>23</lpage>.</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Hyperspectral redundancy detection and modeling with local hurst exponent</article-title>. <source>Phys. A Stat. Mech. its Appl.</source> <volume>592</volume>, <fpage>126830</fpage>. <pub-id pub-id-type="doi">10.1016/j.physa.2021.126830</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zu</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>A large insertion in bhlh transcription factor brtt8 resulting in yellow seed coat in brassica rapa</article-title>. <source>PLoS One</source> <volume>7</volume>, <fpage>e44145</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0044145</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X. L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yin</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Construction of near-infrared reflectance spectroscopy model for seed color of rapeseed</article-title>. <source>Chin. J. Oil Crop Sci.</source> <volume>34</volume>.</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Non-destructive discrimination of homochromatic foreign materials in cut tobacco based on vis-nir hyperspectral imaging</article-title>. <source>J. Sci. Food Agric.</source> <volume>103</volume>, <fpage>4545</fpage>&#x2013;<lpage>4552</lpage>. <pub-id pub-id-type="doi">10.1002/jsfa.12528</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Comparison of multinomial logistic regression and logistic regression: which is more efficient in allocating land use?</article-title> <source>Front. Earth Sci.</source> <volume>8</volume>, <fpage>512</fpage>&#x2013;<lpage>523</lpage>. <pub-id pub-id-type="doi">10.1007/s11707-014-0426-y</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Prediction of oleic acid content of rapeseed using hyperspectral technique</article-title>. <source>Appl. Sci.</source> <volume>11</volume>, <fpage>5726</fpage>. <pub-id pub-id-type="doi">10.3390/app11125726</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Rapeseed variety recognition based on hyperspectral feature fusion</article-title>. <source>Agronomy</source> <volume>12</volume>, <fpage>2350</fpage>. <pub-id pub-id-type="doi">10.3390/agronomy12102350</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Tu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Identification and inheritance of a partially dominant gene for yellow seed colour in brassica napus</article-title>. <source>Plant Breed.</source> <volume>124</volume>, <fpage>9</fpage>&#x2013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.1111/j.1439-0523.2004.01051.x</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Meacham-Hensold</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Montes</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Guan</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Ainsworth</surname>
<given-names>E. A.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>High-throughput field phenotyping using hyperspectral reflectance and partial least squares regression (plsr) reveals genetic modifications to photosynthetic capacity</article-title>. <source>Remote Sens. Environ.</source> <volume>231</volume>, <fpage>111176</fpage>. <pub-id pub-id-type="doi">10.1016/j.rse.2019.04.029</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Meyer</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Dimitriadou</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Hornik</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Weingessel</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Leisch</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Chang</surname>
<given-names>C.-C.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Misc functions of the department of statistics (e1071), tu wien</article-title>. <source>R. Package</source> <volume>1</volume>, <fpage>7</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.32614/CRAN.package.e1071</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Munshi</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Zuidgeest</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Brussel</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>van Maarseveen</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Logistic regression and cellular automata-based modelling of retail, commercial and residential development in the city of ahmedabad, India</article-title>. <source>Cities</source> <volume>39</volume>, <fpage>68</fpage>&#x2013;<lpage>86</lpage>. <pub-id pub-id-type="doi">10.1016/j.cities.2014.02.007</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peng</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Winter wheat canopy water content monitoring based on spectral transforms and &#x201c;three-edge&#x201d;&#x2019; parameters</article-title>. <source>Agric. Water Manag.</source> <volume>240</volume>, <fpage>106306</fpage>. <pub-id pub-id-type="doi">10.1016/j.agwat.2020.106306</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Petisco</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Garc&#xed;a-Criado</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>V&#xe1;zquez-de Aldana</surname>
<given-names>B. R.</given-names>
</name>
<name>
<surname>De Haro</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Garc&#xed;a-Ciudad</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Measurement of quality parameters in intact seeds of brassica species using visible and near-infrared spectroscopy</article-title>. <source>Industrial Crops Prod.</source> <volume>32</volume>, <fpage>139</fpage>&#x2013;<lpage>146</lpage>. <pub-id pub-id-type="doi">10.1016/j.indcrop.2010.04.003</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Pisner</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Schnyer</surname>
<given-names>D. M.</given-names>
</name>
</person-group> (<year>2020</year>). &#x201c;<article-title>Support vector machine</article-title>,&#x201d; in <source>Machine learning</source> (<publisher-name>Elsevier</publisher-name>), <fpage>101</fpage>&#x2013;<lpage>121</lpage>.</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Differential accumulation of phenolic compounds and expression of related genes in black-and yellow-seeded brassica napus</article-title>. <source>J. Exp. Bot.</source> <volume>64</volume>, <fpage>2885</fpage>&#x2013;<lpage>2898</lpage>. <pub-id pub-id-type="doi">10.1093/jxb/ert148</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sen</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Sharma</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kaur</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Banga</surname>
<given-names>S. S.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Near-infrared reflectance spectroscopy calibrations for assessment of oil, phenols, glucosinolates and fatty acid content in the intact seeds of oilseed brassica species</article-title>. <source>J. Sci. Food Agric.</source> <volume>98</volume>, <fpage>4050</fpage>&#x2013;<lpage>4057</lpage>. <pub-id pub-id-type="doi">10.1002/jsfa.8919</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sibanda</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mutanga</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Dube</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Odindi</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Mafongoya</surname>
<given-names>P. L.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>The utility of the upcoming HyspIRI&#x2019;s simulated spectral settings in detecting maize gray leafy spot in relation to sentinel-2 MSI, VEN&#xb5;S, and landsat 8 OLI sensors</article-title>. <source>Agronomy</source> <volume>9</volume>, <fpage>846</fpage>. <pub-id pub-id-type="doi">10.3390/agronomy9120846</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Somers</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Rakow</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Prabhu</surname>
<given-names>V. K.</given-names>
</name>
<name>
<surname>Friesen</surname>
<given-names>K. R.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Identification of a major gene and rapd markers for yellow seed coat colour in brassica napus</article-title>. <source>Genome</source> <volume>44</volume>, <fpage>1077</fpage>&#x2013;<lpage>1082</lpage>. <pub-id pub-id-type="doi">10.1139/g01-097</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ta&#x144;ska</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Rotkiewicz</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Kozirok</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Konopka</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Measurement of the geometrical features and surface color of rapeseeds using digital image analysis</article-title>. <source>Food Res. Int.</source> <volume>38</volume>, <fpage>741</fpage>&#x2013;<lpage>750</lpage>. <pub-id pub-id-type="doi">10.1016/j.foodres.2005.01.008</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Therneau</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Atkinson</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Ripley</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Ripley</surname>
<given-names>M. B.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Package-rpart&#xe2;</article-title>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://cran.ma.ic.ac.uk/web/packages/rpart/rpart.%20pdf">https://cran.ma.ic.ac.uk/web/packages/rpart/rpart. pdf</ext-link>(accessed on 20 April 2016)</comment>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wei</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Nondestructive classification of soybean seed varieties by hyperspectral imaging and ensemble machine learning algorithms</article-title>. <source>Sensors</source> <volume>20</volume>, <fpage>6980</fpage>. <pub-id pub-id-type="doi">10.3390/s20236980</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ye</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yi</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Resynthesis of yellow-seeded brassica napus and comparative metabonomic analysis of differently colored seed coats</article-title>. <source>Mol. Plant Breed.</source>, <fpage>1</fpage>&#x2013;<lpage>14</lpage>. <pub-id pub-id-type="doi">10.13271/j.mpb.022.003979</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ye</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Jia</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Color discrimination based on hyperspectral imaging method</article-title>. <source>Spectrosc. Spectr. Analysis</source> <volume>38</volume>, <fpage>3310</fpage>&#x2013;<lpage>3314</lpage>. <pub-id pub-id-type="doi">10.3964/j.issn.1000-0593(2018)10-3310-05</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Yuan</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Noise-resistant spectral features for retrieving foliar chemical parameters</article-title>. <source>IEEE J. Sel. Top. Appl. Earth Observations Remote Sens.</source> <volume>10</volume>, <fpage>5369</fpage>&#x2013;<lpage>5380</lpage>. <pub-id pub-id-type="doi">10.1109/jstars.2017.2713039</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Rao</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Ji</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Hyperspectral imaging technology combined with deep forest model to identify frost-damaged rice seeds</article-title>. <source>Spectrochimica Acta Part A Mol. Biomol. Spectrosc.</source> <volume>229</volume>, <fpage>117973</fpage>. <pub-id pub-id-type="doi">10.1016/j.saa.2019.117973</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>A reliable methodology for determining seed viability by using hyperspectral data from two sides of wheat seeds</article-title>. <source>Sensors</source> <volume>18</volume>, <fpage>813</fpage>. <pub-id pub-id-type="doi">10.3390/s18030813</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Pang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Yin</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Seed color detection by computer technology in rapeseed</article-title>. <source>Chin. J. Oil Crop Sci.</source> <volume>28</volume>, <fpage>11</fpage>. <pub-id pub-id-type="doi">10.3321/j.issn:1007-9084.2006.01.003</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>