<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2024.1395760</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Estimation of soybean yield based on high-throughput phenotyping and machine learning</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Xiuni</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1757098"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chen</surname>
<given-names>Menggen</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>He</surname>
<given-names>Shuyuan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Xu</surname>
<given-names>Xiangyao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>He</surname>
<given-names>Lingxiao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Li</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2379338"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gao</surname>
<given-names>Yang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tang</surname>
<given-names>Fenda</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gong</surname>
<given-names>Tao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Wenyan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Xu</surname>
<given-names>Mei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Chunyan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yu</surname>
<given-names>Liang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/521992"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Liu</surname>
<given-names>Weiguo</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/374075"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yang</surname>
<given-names>Wenyu</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>College of Agronomy, Sichuan Agricultural University</institution>, <addr-line>Chengdu</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Sichuan Engineering Research Center for Crop Strip Intercropping System</institution>, <addr-line>Chengdu</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Key Laboratory of Crop Ecophysiology and Farming System in Southwest, Ministry of Agriculture</institution>, <addr-line>Chengdu</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Jinyoung Y. Barnaby, United States Department of Agriculture (USDA), United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Ram Kumar Basnet, Rijk Zwaan (Netherlands), Netherlands</p>
<p>Zihao Zheng, Syngenta (United States), United States</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Weiguo Liu, <email xlink:href="mailto:lwgsy@126.com">lwgsy@126.com</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>06</day>
<month>06</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>15</volume>
<elocation-id>1395760</elocation-id>
<history>
<date date-type="received">
<day>04</day>
<month>03</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>20</day>
<month>05</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Li, Chen, He, Xu, He, Wang, Gao, Tang, Gong, Wang, Xu, Liu, Yu, Liu and Yang</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Li, Chen, He, Xu, He, Wang, Gao, Tang, Gong, Wang, Xu, Liu, Yu, Liu and Yang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Soybeans are an important crop used for food, oil, and feed. However, China&#x2019;s soybean self-sufficiency is highly inadequate, with an annual import volume exceeding 80%. RGB cameras serve as powerful tools for estimating crop yield, and machine learning is a practical method based on various features, providing improved yield predictions. However, selecting different input parameters and models, specifically optimal features and model effects, significantly influences soybean yield prediction.</p>
</sec>
<sec>
<title>Methods</title>
<p>This study used an RGB camera to capture soybean canopy images from both the side and top perspectives during the R6 stage (pod filling stage) for 240 soybean varieties (a natural population formed by four provinces in China: Sichuan, Yunnan, Chongqing, and Guizhou). From these images, the morphological, color, and textural features of the soybeans were extracted. Subsequently, feature selection was performed on the image parameters using a Pearson correlation coefficient threshold &#x2265;0.5. Five machine learning methods, namely, CatBoost, LightGBM, RF, GBDT, and MLP, were employed to establish soybean yield estimation models based on the individual and combined image parameters from the two perspectives extracted from RGB images.</p>
</sec>
<sec>
<title>Results</title>
<p>(1) GBDT is the optimal model for predicting soybean yield, with a test set R2 value of 0.82, an RMSE of 1.99 g/plant, and an MAE of 3.12%. (2) The fusion of multiangle and multitype indicators is conducive to improving soybean yield prediction accuracy.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>Therefore, this combination of parameters extracted from RGB images via machine learning has great potential for estimating soybean yield, providing a theoretical basis and technical support for accelerating the soybean breeding process.</p>
</sec>
</abstract>
<kwd-group>
<kwd>RGB</kwd>
<kwd>soybean</kwd>
<kwd>yield</kwd>
<kwd>machine learning</kwd>
<kwd>estimation</kwd>
</kwd-group>
<counts>
<fig-count count="11"/>
<table-count count="5"/>
<equation-count count="8"/>
<ref-count count="39"/>
<page-count count="17"/>
<word-count count="9099"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Plant Breeding</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Soybeans, a crucial oilseed economic crop, serve as a significant source of plant protein and fat in human diets. In addition, soybeans are second only to cash food crops such as wheat, rice and corn, and their trade is the largest among all agricultural products (<xref ref-type="bibr" rid="B39">Zhou and Yang, 2021</xref>). In recent decades, China has faced severe soybean self-sufficiency. According to statistics from the U.S. Department of Agriculture, China&#x2019;s annual soybean imports exceed 100 million tons, with an average yield per unit area of only 132.4 kg/mu, which is significantly lower than the global average of 188.7 kg/mu. The economic returns from soybean cultivation are notably lower than those from summer crops such as corn, leading to a lack of enthusiasm among farmers for soybean cultivation (<xref ref-type="bibr" rid="B28">Ren et&#xa0;al., 2021</xref>). This situation perpetuates a negative cycle for soybean cultivation, emphasizing the importance of developing high-yield soybean varieties. Yield monitoring is a crucial parameter for assessing soybean productivity during the harvesting process. Traditional yield survey methods rely on the experience of farmers or professionals, primarily through destructive sampling, which is time-consuming, labor-intensive, and inherently uncertain. Therefore, nondestructive and accurate yield monitoring is highly important for soybean production. Yield is a comprehensive indicator influenced by factors such as genotype, the environment, and their interactions, making yield estimation highly challenging. To promote efficient soybean breeding, the following question arises: how can soybean yield be accurately and efficiently predicted?</p>
<p>In precision agriculture, a recent hotspot, nondestructive estimation technologies have been developed, providing new methods and means for crop growth estimation and demonstrating promising applications in crop yield estimation. Previous studies have shown that images captured by sensors such as RGB cameras (<xref ref-type="bibr" rid="B18">Ji et&#xa0;al., 2022</xref>), thermal infrared cameras (4), hyperspectral cameras (<xref ref-type="bibr" rid="B8">Chiozza et&#xa0;al., 2021</xref>), and computed tomography (CT) scanners (<xref ref-type="bibr" rid="B17">Hughes et&#xa0;al., 2017</xref>) can be used to extract multiple image traits. These traits can be used to establish predictive models for estimating crop yield. Among these sensors, thermal infrared (TIR) cameras operating under field conditions are strongly influenced by environmental temperature (<xref ref-type="bibr" rid="B15">Hu et&#xa0;al., 2017</xref>) and have very low resolution. Hyperspectral cameras, with multiple continuous bands, can acquire spectral images in various bands. However, due to the large amount of information, imaging is time-consuming, and image processing is slow. However, CT scanners are expensive and challenging to operate. In comparison, RGB cameras, as image acquisition devices, have the advantages of low information acquisition costs, small size, high resolution, and simple operation. These scanners have been widely used in crop monitoring (<xref ref-type="bibr" rid="B35">Yamaguchi et&#xa0;al., 2020</xref>). RGB images can record brightness values (DNs) of the red, green, and blue bands and, based on this, undergo color space conversion to calculate vegetation indices. Compared to spectral images or multisource data fusion, RGB images are correlated with a small amount of data and are easy to handle. Therefore, over the past decade, efforts have been made to develop the application of RGB cameras in crop yield estimation.</p>
<p>Machine learning (ML) is a significant branch of computer science, and with the continuous advancement of sensor technology and image-processing techniques, ML has found extensive applications in various aspects of precision agriculture research, including yield estimation. In 2021, Saul Justin Newman et&#xa0;al. demonstrated the potential of ML algorithms for robustly predicting important agronomic traits, including yield, and developing and testing new interpretable models in crop biology (9). As an emerging and more complex statistical model, ML can better describe the nonlinear relationship between input variables and predicted outcomes. Recent studies have consistently shown the significant advantages of this approach over linear models in yield prediction (<xref ref-type="bibr" rid="B6">Cao et&#xa0;al., 2022</xref>). ML algorithms have been widely used to establish predictive models relating image features to biological parameters. ML algorithms exhibit greater accuracy and efficiency than simple linear regression models (<xref ref-type="bibr" rid="B34">Wang et&#xa0;al., 2021</xref>).</p>
<p>Various methods have been proposed and applied to estimate crop yield (<xref ref-type="bibr" rid="B21">Li et&#xa0;al., 2021</xref>). employed the random forest method to achieve dynamic yield prediction for three crops in China&#x2014;winter wheat, corn, and rice. They explored the optimal lead time for yield prediction for different crops and assessed the importance of various predictive factors. Minghan Cheng et&#xa0;al. conducted research on a prediction algorithm for Chinese corn yield using two machine learning methods, random forest regression (RFR) and gradient boosting decision trees (GBDTs). Their results showed that earlier lead times resulted in lower prediction accuracy, but the accuracy remained relatively high within at least 24 days before maturity (coefficient of determination (R<sup>2</sup>)&gt;0.77, relative root mean square error (rRMSE)&lt;16.92%) (<xref ref-type="bibr" rid="B7">Cheng et&#xa0;al., 2022</xref>, <xref ref-type="bibr" rid="B19">Jin et&#xa0;al., 2017</xref>). developed a method for winter wheat yield estimation by combining the AquaCrop model with optical and radar imaging data using a location and orientation system algorithm, which showed a high correlation between the predicted and measured yields (<xref ref-type="bibr" rid="B11">Gilliot et&#xa0;al., 2020</xref>). demonstrated the potential of predicting corn yield based on extracted plant height from images (<xref ref-type="bibr" rid="B10">Feng et&#xa0;al., 2020</xref>). used ensemble machine learning models for in-season alfalfa yield estimation (<xref ref-type="bibr" rid="B32">Sun et&#xa0;al., 2020</xref>). developed six mainstream machine learning models to estimate potato tuber yield and obtained satisfactory results. Maitiniyazi Maimaitijiang et&#xa0;al (<xref ref-type="bibr" rid="B6">Cao et&#xa0;al., 2022</xref>). demonstrated that using low-cost drones for multimodal data fusion under a deep neural network (DNN) framework can provide relatively accurate and robust soybean yield estimates. However, the predictive performance of models varies for different crops and environmental parameters, and limited research has explored the effects of different machine learning models on the prediction of individual soybean plant yields for multiple varieties.</p>
<p>The gradient boosting decision tree (GBDT) model is an additive model and a form of boosting in ensemble learning (<xref ref-type="bibr" rid="B31">Shi et&#xa0;al., 2018</xref>). This model reduces the residuals during training by continually combining linear combinations of functions to achieve regression. The light gradient boosting machine (LightGBM) is another popular gradient boosting method known for reducing errors, thereby improving accuracy and speed. However, this approach does not support string-type data and requires special algorithms for splitting categorical data, as it requires integer values (such as indices) instead of column string names (<xref ref-type="bibr" rid="B5">Brinkhoff et&#xa0;al., 2023</xref>; <xref ref-type="bibr" rid="B29">Seireg et&#xa0;al., 2023</xref>). The categorical boosting (CatBoost) algorithm, an open-source machine learning library released by the Russian search giant Yandex in 2017, is also part of the boosting algorithm series. CatBoost is a novel machine learning algorithm framework based on the gradient boosting decision tree (GBDT). In contrast to LightGBM, CatBoost can automatically convert strings into index values and handle missing numerical values. Unlike traditional neural network models, CatBoost does not require many samples for training; it adapts well to training with small-scale samples and provides high-precision diagnostics. The advantages of CatBoost include overcoming gradient bias, effectively addressing prediction bias, improving algorithm accuracy, enhancing generalizability, and preventing overfitting (<xref ref-type="bibr" rid="B16">Huang, 2020</xref>; <xref ref-type="bibr" rid="B23">Liu, 2020</xref>; <xref ref-type="bibr" rid="B24">Lu et&#xa0;al., 2022</xref>).</p>
<p>The random forest (RF) algorithm was proposed by Breiman in 2001 and is an ensemble machine learning method based on multiple classification regression trees (<xref ref-type="bibr" rid="B4">Breiman, 2001</xref>). The basic concept involves creating homogeneous subsets through bootstrapping and growing decision trees in each subset (number of trees: ntree) from the training dataset. The final result of RF regression is obtained by averaging all the decision trees (<xref ref-type="bibr" rid="B4">Breiman, 2001</xref>). Due to repeated sampling, RF regression can effectively reduce overfitting (<xref ref-type="bibr" rid="B4">Breiman, 2001</xref>).</p>
<p>The multilayer perceptron (MLP) model is a simple neural network and one of the earliest models in artificial intelligence. This model is the most widely used artificial intelligence model in all scientific numerical modeling fields (<xref ref-type="bibr" rid="B26">Paswan and Begum, 2013</xref>; <xref ref-type="bibr" rid="B20">Khalifani et&#xa0;al., 2022</xref>). MLPs typically include a set of sensory units (basic neurons) and consist of an input layer, one to several hidden layers, and an output layer. This method creates nonlinear mappings between input target samples, and input signals from the input layer to the output layer propagate forward (<xref ref-type="bibr" rid="B1">Aghelpour and Varshavian, 2021</xref>).</p>
<p>The development of nondestructive estimation techniques enables efficient and accurate monitoring of soybean yield, significantly shortening the time required for soybean breeding, meeting the needs of breeders, and facilitating efficient breeding. Therefore, the purpose of this study was to evaluate the accuracy of soybean yield estimation using five machine learning algorithms (CatBoost, LightGBM, RF, GBDT, and MLP) and to determine the optimal model for early soybean yield estimation using phenotypic features extracted from multiangle RGB images. This approach aims to increase the efficiency of obtaining soybean biological traits and accelerate the soybean breeding process.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Experimental site overview</title>
<p>The experiment was conducted during 2022&#x2013;2023 at the Chongzhou Experimental Base of Sichuan Agricultural University (103&#xb0;39&#x2019;E, 30&#xb0;33&#x2019;N), as depicted in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1A</bold>
</xref>. This region has a subtropical monsoon climate, with an average temperature of 16.2&#xb0;C, an annual total sunshine duration of 1400 hours, and an annual total rainfall of 918 mm. The basic chemical properties of the 0&#x2013;20 cm soil layer at the experimental site were as follows: organic matter content, 24.3 g&#xb7;kg<sup>-1</sup>; total potassium, 15.2 g&#xb7;kg<sup>-1</sup>; total nitrogen, 1.6 g&#xb7;kg<sup>-1</sup>; total phosphorus, 1.3 g&#xb7;kg<sup>-1</sup>; available potassium, 169.4 mg&#xb7;kg<sup>-1</sup>; available nitrogen, 299.5 mg&#xb7;kg<sup>-1</sup>; and available phosphorus, 36.5 mg&#xb7;kg<sup>-1</sup>.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Study area and experimental design. <bold>(A)</bold> Geographic location of the Sichuan Agricultural University Modern Agriculture Research and Development Base; <bold>(B)</bold> sole cropping of soybeans; and <bold>(C)</bold> strip intercropping of corn and soybeans.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1395760-g001.tif"/>
</fig>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Experimental design</title>
<p>The experimental materials consisted of 240 soybean varieties (a natural population formed by four provinces in China: Sichuan, Yunnan, Chongqing, and Guizhou) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Appendix 3</bold>
</xref>). As shown in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S1</bold>
</xref>, the genetic diversity of this population is extremely extensive, and all of these populations were planted in 2022. In 2023, based on the previous year&#x2019;s yield, extremely low-performing varieties were excluded, resulting in the final cultivation of 202 soybean varieties. Over the two years of field experiments, each variety was subjected to three replications and two planting methods to increase yield differences (sole cropping and strip intercropping with corn). In the strip intercropping system with corn, the corn variety used was Zhongyu 3, a semicompact spring corn. The planting materials used were provided by the Crop Strip Composite Planting Engineering Technology Research Center of the College of Agronomy, Sichuan Agricultural University. The field layout is shown in <xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1B, C</bold>
</xref>. In the corn&#x2013;soybean strip intercropping system, two rows of corn (corn strip) were intercropped with two rows of soybean (soybean strip), with a length of 20 m and a width of 2 m (the row spacing for both the corn-corn and soybean-soybean systems was 40 cm, and the spacing between the corn and soybean strips was 60 cm). Both corn and soybean were single-hole planted, with a hole spacing of 20 cm for corn. For soybean, pots were planted with a diameter of 25 cm, a diameter of 20 cm, and a height of 25 cm; the pots were filled with 10 kg of soil. Under the intercropping treatment, the potted soybeans were placed in wide rows of corn, with two pots placed side by side in each strip. The soybean plant density and row spacing under the monocropping treatment were consistent with those under the intercropping treatment. The base fertilizer for corn was compound fertilizer (N:P:K = 13:5:7) applied at a rate of 923 kg&#xb7;hm<sup>-2</sup>. At the jointing and tasseling stages, urea (N &#x2265; 46%) was applied at rates of 98 kg&#xb7;hm<sup>-2</sup> and 163 kg&#xb7;hm<sup>-2</sup>, respectively. No fertilizer was applied throughout the entire growth period of the soybeans.</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>High-throughput phenotypic data acquisition</title>
<p>The flowchart depicted in <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref> illustrates the methodology employed in this study for obtaining high-throughput soybean phenotypic data. This process included image acquisition, image segmentation (offline model training and online image segmentation), and parameter extraction. The details of this flowchart are discussed below. In this study, a total of three categories of parameters were extracted from two shooting angles, including 6 color parameters each for the top and side views, 17 textural parameters each for the top and side views, and 16 and 30 morphological parameters for the top and side views, respectively (refer to <xref ref-type="supplementary-material" rid="SM1">
<bold>Appendix 1</bold>
</xref>). In this research, the color, texture, and morphological parameters from the top and side views were individually or collectively used to estimate soybean yield.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>High-throughput phenotyping of soybeans.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1395760-g002.tif"/>
</fig>
<sec id="s2_3_1">
<label>2.3.1</label>
<title>Image acquisition</title>
<p>In 2022&#x2013;2023, we utilized a self-developed single soybean plant imaging platform from Sichuan Agricultural University as the capture platform. This platform, centered on an automatic rotating table, is equipped with industrial cameras on both the top and side of the table. The table rotation speed and number of cycles are controlled by a programmable logic controller (PLC). The selected Hikvision industrial cameras (MV-CH250&#x2013;90GC, China) paired with Hikvision robot lenses (MVL-KF1624M-25MP, focal length 16 mm, maximum aperture F2.4, 1.2 C, Hangzhou, China) were used as sensors for capturing images. During the capture process, the camera parameters were set as follows: focal lengths for the side and top cameras were 2.3 mm and 2.4 mm, respectively; shooting distances were 2.6 m and 1.8 m, respectively; and the camera mode was set to aperture priority (AV) with an aperture size of 2.4 and automatic white balance, ensuring a camera frame rate &#x2265;4.5 fps. The side and top images were stored in JPG format with resolutions of 4000*4000 and 4604*4604, respectively. A white standard board with a diameter of 30 cm was used as the scale, and a scale image of both the top and side views was collected to calculate the values of the extracted image features.</p>
<p>RGB images were collected during the R6 stage (pod filling stage) of soybeans. Each time, images were captured by randomly selecting 3 pots from each treatment. The soybean plants were placed on the turntable, and every 60&#xb0; rotation, a side image was obtained. Additionally, a random overhead view was captured. In total, one overhead view and six side views were collected for each soybean plant. A total of 18,564 images were captured, 15,912 of which were collected in 2022 (8,640 side views and 1,440 top views), and 8,484 were captured in 2023 (7,272 side views and 1,212 top views). The specific imaging process is illustrated in <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>.</p>
</sec>
<sec id="s2_3_2">
<label>2.3.2</label>
<title>Image segmentation</title>
<p>The soybean plant segmentation model utilized the U-Net neural network. In this study, 2000 images were used as the training set to train U-Net. The images were divided into training, testing, and validation sets at a ratio of 8:1:1. The U-net network was pretrained using the VOC 2012 dataset to enhance its feature extraction capability, and the obtained weights were utilized for model training. Subsequently, transfer learning was performed using the pretrained weights to conduct formal training on U-Net. The training was conducted on a computer with a Windows 10 system using a resolution of 2048&#xd7;2048 and an NVIDIA GeForce RTX 3090 with 48 GB of memory. The training was implemented based on the PyTorch framework. The training process comprised two stages: the first stage involved freezing the main feature extraction network and enhancing the weights of the feature extraction network, training only the classification network. The parameters were adjusted as follows: learning rate = 110^-4, epochs = 60, batch size = 4, and learning rate decay = 0.92. In the second stage, the feature extraction network was unfrozen, and the entire network was trained. The parameters were adjusted as follows: learning rate = 110^-5, epochs = 50, batch size = 1, and learning rate decay = 0.95.</p>
</sec>
<sec id="s2_3_3">
<label>2.3.3</label>
<title>Image parameter extraction</title>
<sec id="s2_3_3_1">
<label>2.3.3.1</label>
<title>Color features</title>
<p>Extraction was performed on the three channels (R, G, and B) of the finely segmented color image to calculate color trait values. The color parameters extracted in this study included the blue, green, red, blue-green, blue-red, and green-red ratios, comprising six indicators. The calculation formulas are as follows <xref ref-type="disp-formula" rid="eq1">Equations (1</xref>&#x2013;<xref ref-type="disp-formula" rid="eq3">3)</xref>:</p>
<disp-formula id="eq1">
<label>(1)</label>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq2">
<label>(2)</label>
<mml:math display="block" id="M2">
<mml:mrow>
<mml:mi>G</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:msub>
<mml:mi>G</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq3">
<label>(3)</label>
<mml:math display="block" id="M3">
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:msub>
<mml:mi>B</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In the formulas, Ri represents the pixel value of the red channel for the i-th pixel of the plant, R denotes the red mean, Gi represents the pixel value of the green channel for the i-th pixel of the plant, G denotes the green mean, Bi represents the pixel value of the blue channel for the i-th pixel of the plant, and B denotes the blue mean. n represents the number of pixels in the plant.</p>
<p>For each image, a set of R, G, and B values can be obtained, and the values of the side color parameters for each plant are the averages of these values from six images. The blue-green ratio, blue-red ratio, and green-red ratio are then calculated as the ratios of the blue mean to the green mean, the blue mean to the red mean, and the green mean to the red mean, respectively.</p>
</sec>
<sec id="s2_3_3_2">
<label>2.3.3.2</label>
<title>Textural features</title>
<p>Image parameter extraction was conducted using Python 3.7 (Python Software Foundation, <ext-link ext-link-type="uri" xlink:href="https://www.python.org/">https://www.python.org/</ext-link>) and the scikit-learn library v0.21.3. Textural processing is a common method for extracting information from digital images, and although it lacks a formal definition, an intuitive description of textural information captures its properties well. Textural computation involves two main approaches: spectral methods based on the properties of the Fourier spectrum and detection of the global periodicity of the image by identifying high-energy narrow peaks in the spectrum (<xref ref-type="bibr" rid="B3">Bharati et&#xa0;al., 2004</xref>). On the other hand, statistical methods can extract the directionality, roughness, and degree of order in images. Textural traits were calculated using the gray-level co-occurrence matrix (GLCM), which was initially proposed by Hong Jiguang (<xref ref-type="bibr" rid="B14">Hong, 1984</xref>). By combining the overall soybean textural gray-level division, the color space of the color image was converted to the HIS color space, with the I channel serving as the grayscale image. The specific calculation formula is as follows <xref ref-type="disp-formula" rid="eq4">Equation (4)</xref>:</p>
<disp-formula id="eq4">
<label>(4)</label>
<mml:math display="block" id="M4">
<mml:mrow>
<mml:mi>I</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mfrac>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>G</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>B</mml:mi>
</mml:mrow>
<mml:mn>3</mml:mn>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>The element H(i, j) in the gray-level co-occurrence matrix is defined as the total number of pixels with a normalized grayscale of i in the grayscale image and a normalized gradient of j in the gradient image. The probability of having a grayscale value of i and a gradient value of j is calculated as follows <xref ref-type="disp-formula" rid="eq5">Equation (5)</xref>:</p>
<disp-formula id="eq5">
<label>(5)</label>
<mml:math display="block" id="M5">
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>.</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mi>H</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo stretchy="false">/</mml:mo>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>f</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mi>H</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where i = 0, 1, 2&#x2026;, <italic>Nf</italic> represents the normalized maximum grayscale value and j = 0, 1, 2&#x2026;; a total of 15 textural traits were obtained. In addition, two histogram traits were included in this study. The textural parameters on the side were the averages of six images. The specific calculation formulas are provided in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Formulas for Textural Parameter Calculations.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Number</th>
<th valign="middle" align="center">Full name</th>
<th valign="middle" align="center">Calculation formula</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">1</td>
<td valign="middle" align="left">Small gradient advantage</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im1">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mn>1</mml:mn>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mtext>i</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mtext>j</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mtext>H</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mtext>i</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mtext>j</mml:mtext>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mtext>j</mml:mtext>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
<mml:mo stretchy="false">/</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mtext>i</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mtext>j</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mtext>H</mml:mtext>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
<mml:mo stretchy="false">(</mml:mo>
<mml:mtext>i</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mtext>j</mml:mtext>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">2</td>
<td valign="middle" align="left">Large gradient advantage</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im2">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mn>2</mml:mn>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mtext>i</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mtext>j</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:msup>
<mml:mi>j</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mtext>H</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mtext>i</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mtext>j</mml:mtext>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
<mml:mo stretchy="false">/</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mtext>i</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mtext>j</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mtext>H</mml:mtext>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
<mml:mo stretchy="false">(</mml:mo>
<mml:mtext>i</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mtext>j</mml:mtext>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">3</td>
<td valign="middle" align="left">energy</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im3">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mn>3</mml:mn>
<mml:mo>=</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mtext>i</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mtext>j</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mtext>i</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mtext>j</mml:mtext>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">4</td>
<td valign="middle" align="left">The gradient distribution has inhomogeneity</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im4">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mn>4</mml:mn>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
<mml:mo stretchy="false">/</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mi>H</mml:mi>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">5</td>
<td valign="middle" align="left">Gradient average</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im5">
<mml:mrow>
<mml:msub>
<mml:mtext>&#x3bc;</mml:mtext>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:munderover>
<mml:mi>j</mml:mi>
<mml:mo>&#x2217;</mml:mo>
<mml:mo stretchy="false">[</mml:mo>
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:munderover>
<mml:mi>P</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">6</td>
<td valign="middle" align="left">Gradient entropy</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im6">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mn>5</mml:mn>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
<mml:mo>*</mml:mo>
<mml:mi>log</mml:mi>
</mml:mrow>
</mml:mstyle>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mi>P</mml:mi>
</mml:mstyle>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">7</td>
<td valign="middle" align="left">Grayscale entropy</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im7">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mn>6</mml:mn>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
<mml:mo>*</mml:mo>
<mml:mi>log</mml:mi>
</mml:mrow>
</mml:mstyle>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mi>P</mml:mi>
</mml:mstyle>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">8</td>
<td valign="middle" align="left">Mixed entropy</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im8">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mn>7</mml:mn>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>*</mml:mo>
<mml:mi>l</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>g</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">9</td>
<td valign="middle" align="left">Differential moment</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im9">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mn>8</mml:mn>
<mml:mo>=</mml:mo>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mi>P</mml:mi>
</mml:mstyle>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">10</td>
<td valign="middle" align="left">Deficit moment</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im10">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mn>9</mml:mn>
<mml:mo>=</mml:mo>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>+</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfrac>
<mml:mi>P</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">11</td>
<td valign="middle" align="left">Gradient standard deviation</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im11">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mo>{</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:munderover>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x3bc;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mstyle>
<mml:mo stretchy="false">[</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:munderover>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo stretchy="false">]</mml:mo>
<mml:msup>
<mml:mo>}</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo stretchy="false">/</mml:mo>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">12</td>
<td valign="middle" align="left">Correlation</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im12">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mn>10</mml:mn>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>i</mml:mi>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>j</mml:mi>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x3bc;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x3bc;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo stretchy="false">)</mml:mo>
<mml:mi>P</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">13</td>
<td valign="middle" align="left">Grayscale histogram variance</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im13">
<mml:mrow>
<mml:msup>
<mml:mi>S</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>255</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mi>x</mml:mi>
<mml:mo>&#x2212;</mml:mo>
</mml:msup>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mrow>
<mml:mn>255</mml:mn>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">14</td>
<td valign="middle" align="left">Grayscale histogram entropy</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im14">
<mml:mrow>
<mml:mi>H</mml:mi>
<mml:mo>=</mml:mo>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>255</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mi>log</mml:mi>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">15</td>
<td valign="middle" align="left">The grayscale is unevenly distributed</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im15">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mn>11</mml:mn>
<mml:mo>=</mml:mo>
<mml:mo>{</mml:mo>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mi>H</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:msup>
<mml:mo stretchy="false">]</mml:mo>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>}</mml:mo>
<mml:mo stretchy="false">/</mml:mo>
<mml:mo stretchy="false">[</mml:mo>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mi>H</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">16</td>
<td valign="middle" align="left">Gray average</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im16">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3bc;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:munderover>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>*</mml:mo>
<mml:mo stretchy="false">[</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:munderover>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td valign="middle" align="left">17</td>
<td valign="middle" align="left">Grayscale standard deviation</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im17">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c3;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mo>{</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:munderover>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>&#x3bc;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mstyle>
<mml:mo stretchy="false">[</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>16</mml:mn>
</mml:mrow>
</mml:munderover>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo stretchy="false">]</mml:mo>
<mml:msup>
<mml:mo>}</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo stretchy="false">/</mml:mo>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2_3_3_3">
<label>2.3.3.3</label>
<title>Morphological features</title>
<p>The number of binary image pixels was calculated, and the side data represent the average of six sideview images. Definitions for each indicator are provided in <xref ref-type="supplementary-material" rid="SM1">
<bold>Appendix 2</bold>
</xref>.</p>
</sec>
</sec>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Yield data collection</title>
<p>After the soybeans matured, manual collection and recording of individual soybean yields were conducted. The yield distribution is depicted in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>, and the data for both years follow a normal distribution.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Normal distribution plot of manually measured individual soybean yields <bold>(A)</bold> 2381 trial materials. <bold>(B)</bold> 1291 training set materials. <bold>(C)</bold> 1091 test set materials.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1395760-g003.tif"/>
</fig>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Broad-sense heritability calculation</title>
<p>We evaluated the broad-sense heritability (<italic>H<sup>2</sup>
</italic>) of the data over the two years using the formula <italic>H<sup>2</sup>
</italic> = V<sub>g</sub>/(V<sub>g</sub> + V<sub>ll</sub>/n + V<sub>ly</sub>/n + V<sub>r</sub>/n<sup>2</sup>). Here, V<sub>g</sub> represents the genotypic variance, V<sub>ll</sub> represents the variance between varieties and locations, V<sub>ly</sub> represents the variance between varieties and years, and V<sub>r</sub> represents the residual variance, with n denoting the number of replicates. Means and standard deviations were calculated using BLUP values, and the statistical significance of P values was determined using paired <italic>t</italic> tests.</p>
</sec>
<sec id="s2_6">
<label>2.6</label>
<title>Construction and evaluation of soybean yield estimation models</title>
<p>To further investigate the estimation accuracy of the yield prediction models, data preprocessing was performed using R Version 4.1.1 (R Foundation, Vienna, Austria). The outlier test function from the car package was utilized to remove outliers. A total of 149 outliers were eliminated from the 1440 datasets for 2022, and 121 outliers were removed from the 1212 datasets for 2023. Subsequent analyses were based on the remaining 2382 datasets. The statistical modeling was conducted using Python 3.7. In this study, five different regression methods were employed: CatBoost, LightGBM, RF, GBDT, and MLP. All the input parameters were normalized. The two years of data were divided into training and testing datasets based on the years. The samples from 2022, totaling 1291, were used as the training set, while those from 2023, totaling 1091, were used as the testing set. Tenfold cross-validation was also performed. All the numerical data were plotted using Origin 2019 and SPSS 2018. The data analysis methods employed in this study are illustrated in <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Data analysis workflow.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1395760-g004.tif"/>
</fig>
<sec id="s2_6_1">
<label>2.6.1</label>
<title>Machine learning parameter adjustment</title>
<p>In this study, the loss functions for all five models were set to &#x2018;friedman_mse&#x2019;, and a grid search was employed for hyperparameter tuning. The final settings for the GBDT model were a learning rate of 0.1, a maximum depth of 5, and a maximum iteration count of 800. For the CatBoost model, the final setting was a learning rate of 0. 05, a maximum tree depth of 10, and a maximum iteration count of 2000. In the LightGBM model, the final settings were a learning rate of 0.1 and a maximum tree depth of 10. In the RSF model, the optimal number of trees (ntree) for soybean yield estimation was determined by testing ntree values from 100 to 500 in increments of 50. The value 300 was chosen because it achieved stable and relatively low mean absolute error (MAE) and high R<sup>2</sup> in the soybean yield estimation model. Other hyperparameters in the RF regression were set to the default values using the regressor function in the scikit-learn library. For the MLP model, the activation function was set to &#x2018;relu,&#x2019; regularization coefficient to 0.01, two hidden layers were established with 100 neurons in the first layer and 50 neurons in the second layer, the learning_rate was set to &#x2018;adaptive&#x2019;, and the solver was set to &#x2018;sgd.&#x2019;</p>
</sec>
<sec id="s2_6_2">
<label>2.6.2</label>
<title>Modeling evaluation</title>
<p>To reduce the impact of data partitioning on model estimation errors, the root mean square error (RMSE), MAE, and R<sup>2</sup> were calculated to assess the performance of each estimation method. The specific calculation formulas are as follows <xref ref-type="disp-formula" rid="eq6">Equation (6</xref>&#x2013;<xref ref-type="disp-formula" rid="eq8">8)</xref>:</p>
<disp-formula id="eq6">
<label>(6)</label>
<mml:math display="block" id="M6">
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>m</mml:mi>
</mml:mfrac>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>m</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mover>
<mml:mtext mathvariant="italic" mathsize="70%">yi</mml:mtext>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:msqrt>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq7">
<label>(7)</label>
<mml:math display="block" id="M7">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>m</mml:mi>
</mml:mfrac>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>m</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mover>
<mml:mtext mathvariant="italic" mathsize="70%">yi</mml:mtext>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>|</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq8">
<label>(8)</label>
<mml:math display="block" id="M8">
<mml:mrow>
<mml:msup>
<mml:mi>R</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mover>
<mml:mtext mathvariant="italic" mathsize="75%">yi</mml:mtext>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mi>i</mml:mi>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mover>
<mml:mtext mathvariant="italic" mathsize="75%">yi</mml:mtext>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Here, <inline-formula>
<mml:math display="inline" id="im18">
<mml:mrow>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mover>
<mml:mtext mathvariant="italic" mathsize="70%">yi</mml:mtext>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> represents the difference between the actual values and predicted values on the test set.</p>
</sec>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Correlations between color, texture, and morphological parameters and yield</title>
<p>The red area indicates a negative correlation, while the blue area indicates a positive correlation. Lighter colors represent weaker correlations. As shown in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>, there were a total of 23 image indicators in the sideview that were absolute correlations (hereinafter referred to as correlations) with a yield greater than 0.5. Among the sideview color parameters, all the indicators were correlated with a yield less than 0.5 (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5A</bold>
</xref>). Among the sideview morphological parameters, 13 indicators had a correlation with a yield greater than 0.5, and except for SPA2 and SCA, the other 11 indicators were positively correlated with yield (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>), indicating that an increase in these 11 indicators leads to an increase in soybean yield. Among the sideview textural parameters, 10 indicators were correlated with a yield greater than 0.5. Among them, SGD, SIG1, SE, and SDM were negatively correlated with yield, while SG, SGA, SGE1, SGE2, SME, and SHE were positively correlated with yield (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5C</bold>
</xref>).</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Correlation between three types of image parameters and yield. <bold>(A)</bold> Correlations between sideview color parameters and yield; <bold>(B)</bold> correlations between sideview morphology and yield; <bold>(C)</bold> correlations between sideview textural parameters and yield; <bold>(D)</bold> correlations between top-view color parameters and yield; <bold>(E)</bold> correlations between top-view morphology and yield; and <bold>(F)</bold> correlations between top-view textural parameters and yield.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1395760-g005.tif"/>
</fig>
<p>In the top view, a total of 16 image indicators were correlated with a yield greater than 0.5. According to the top-view color parameters, all the indicators were correlated with a yield less than 0.5 (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5D</bold>
</xref>). Among the top-view morphological parameters, 9 were correlated with a yield greater than 0.5, and all the indicators were positively correlated with yield (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5E</bold>
</xref>). Among the top-view textural parameters, 7 indicators exhibited a correlation with a yield greater than 0.5. Among them, TE, TDM, and TGH had negative correlations with yield, while TG, TGE1, TME, and THE had positive correlations with yield (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5F</bold>
</xref>).</p>
<p>An interesting phenomenon was observed here: the relationship between the image parameters and yield was quite similar between the side and top views. For example, SE and SDM exhibited a high negative correlation with yield, corresponding to TE and TDM, which also exhibited a high negative correlation with yield in the top-view image parameters. Similarly, SG, SGE1, SME, and SHE exhibited a high positive correlation with yield, corresponding to TG, TGE1, the TME, and the, which also showed a high positive correlation with yield in the top-view image parameters. Therefore, further exploration of the relationships between side- and top-view image parameters and soybean yield is particularly intriguing.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Prediction of yield based on sideview image parameters</title>
<p>The sideview image parameters with Pearson coefficients greater than 0.5 were selected for soybean yield estimation. In this study, the CatBoost, LightGBM, GBDT, RF, and MLP models were used to estimate soybean yield, and three combinations were trained and evaluated. The three combinations of input variables were named m1-m3, where m1 consists of morphological parameters (SPA1, SCA1, 1/5MW, 2/5MW, 3/5MW, 4/5MW, SMW, TC2, SMIW, SRA, SSC, SPA2, and SCA), m2 consists of textural parameters (SMG, SGD, SIG1, SE, SG, SGA, SGE1, SGE2, SME, and SDM), and m3 consists of morphological and textural parameters.</p>
<p>As shown in <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>, the R<sup>2</sup> value on the training set was generally greater than that on the test set, and the RMSE and MAE were generally lower than those on the test set. For m1, the prediction accuracy of the five models on the test set fluctuated greatly, with 0.42 &#x2264; R<sup>2</sup> &#x2264; 0.77, and the GBDT and LightGBM models achieved the best prediction accuracy, both with R<sup>2</sup> values of 0.77. The performance accuracy of RF was the lowest, and the prediction accuracies of CatBoost and MLP were the lowest (R<sup>2</sup> &#x2264; 0.52), with the highest errors. For m2, the overall prediction accuracy of the five models was lower than that for m1, but the GBDT model still achieved the highest prediction accuracy, with R<sup>2 =</sup> 0.73, while CatBoost and MLP yielded the lowest prediction accuracies, with R<sup>2</sup> values of 0.49 and 0.44, respectively. For m3, after combining textural parameters with morphological parameters, the overall prediction accuracy of the five models slightly improved, with the MLP model showing the most significant improvement. According to <xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6A&#x2013;I</bold>
</xref>, the error order is m2 &gt; m1 &gt; m3, and the R<sup>2</sup> order is m3 &gt; m1 &gt; m2. With the enrichment of indicators, the prediction accuracy increased, and the error decreased, with morphological parameters leading to better estimation performance than textural parameters. Overall, in the prediction of soybean yield based on sideview image parameters, the optimal predictive model was GBDT.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Prediction of yield based on sideview image parameters.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" rowspan="2" colspan="2" align="center"/>
<th valign="top" colspan="3" align="center">m1</th>
<th valign="top" colspan="3" align="center">m2</th>
<th valign="top" colspan="3" align="center">m3</th>
</tr>
<tr>
<th valign="top" align="center">RMSE<break/>(%)</th>
<th valign="top" align="center">MAE<break/>(g/per)</th>
<th valign="top" align="center">R<sup>2</sup>
</th>
<th valign="top" align="center">RMSE<break/>(%)</th>
<th valign="top" align="center">MAE<break/>(g/per)</th>
<th valign="top" align="center">R<sup>2</sup>
</th>
<th valign="top" align="center">RMSE<break/>(%)</th>
<th valign="top" align="center">MAE<break/>(g/per)</th>
<th valign="top" align="center">R<sup>2</sup>
</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" rowspan="2" align="center">CatBoost</td>
<td valign="top" align="center">Val</td>
<td valign="top" align="center">5.18</td>
<td valign="top" align="center">3.93</td>
<td valign="top" align="center">0.65</td>
<td valign="top" align="center">5.72</td>
<td valign="top" align="center">4.36</td>
<td valign="top" align="center">0.58</td>
<td valign="top" align="center">4.93</td>
<td valign="top" align="center">3.79</td>
<td valign="top" align="center">0.71</td>
</tr>
<tr>
<td valign="top" align="center">Cal</td>
<td valign="top" align="center">5.98</td>
<td valign="top" align="center">4.49</td>
<td valign="top" align="center">0.52</td>
<td valign="top" align="center">6.19</td>
<td valign="top" align="center">4.68</td>
<td valign="top" align="center">0.49</td>
<td valign="top" align="center">5.78</td>
<td valign="top" align="center">4.38</td>
<td valign="top" align="center">0.58</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">LightBoost</td>
<td valign="top" align="center">Val</td>
<td valign="top" align="center">1.49</td>
<td valign="top" align="center">1.03</td>
<td valign="top" align="center">0.91</td>
<td valign="top" align="center">2.56</td>
<td valign="top" align="center">1.88</td>
<td valign="top" align="center">0.88</td>
<td valign="top" align="center">1.17</td>
<td valign="top" align="center">0.82</td>
<td valign="top" align="center">0.94</td>
</tr>
<tr>
<td valign="top" align="center">Cal</td>
<td valign="top" align="center">3.88</td>
<td valign="top" align="center">2.56</td>
<td valign="top" align="center">0.77</td>
<td valign="top" align="center">5.05</td>
<td valign="top" align="center">3.48</td>
<td valign="top" align="center">0.66</td>
<td valign="top" align="center">3.85</td>
<td valign="top" align="center">2.46</td>
<td valign="top" align="center">0.78</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">GBDT</td>
<td valign="top" align="center">Val</td>
<td valign="top" align="center">1.58</td>
<td valign="top" align="center">1.46</td>
<td valign="top" align="center">0.9</td>
<td valign="top" align="center">1.62</td>
<td valign="top" align="center">1.57</td>
<td valign="top" align="center">0.89</td>
<td valign="top" align="center">1.49</td>
<td valign="top" align="center">1.55</td>
<td valign="top" align="center">0.92</td>
</tr>
<tr>
<td valign="top" align="center">Cal</td>
<td valign="top" align="center">4.02</td>
<td valign="top" align="center">2.48</td>
<td valign="top" align="center">0.77</td>
<td valign="top" align="center">3.12</td>
<td valign="top" align="center">2.85</td>
<td valign="top" align="center">0.73</td>
<td valign="top" align="center">4.10</td>
<td valign="top" align="center">2.32</td>
<td valign="top" align="center">
<bold>0.78</bold>
</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">RF</td>
<td valign="top" align="center">Val</td>
<td valign="top" align="center">1.35</td>
<td valign="top" align="center">1.02</td>
<td valign="top" align="center">0.91</td>
<td valign="top" align="center">2.01</td>
<td valign="top" align="center">1.35</td>
<td valign="top" align="center">0.91</td>
<td valign="top" align="center">1.24</td>
<td valign="top" align="center">0.81</td>
<td valign="top" align="center">0.95</td>
</tr>
<tr>
<td valign="top" align="center">Cal</td>
<td valign="top" align="center">3.49</td>
<td valign="top" align="center">2.15</td>
<td valign="top" align="center">0.71</td>
<td valign="top" align="center">5.10</td>
<td valign="top" align="center">3.65</td>
<td valign="top" align="center">0.71</td>
<td valign="top" align="center">3.5</td>
<td valign="top" align="center">2.41</td>
<td valign="top" align="center">0.77</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="center">MLP</td>
<td valign="top" align="center">Val</td>
<td valign="top" align="center">6.05</td>
<td valign="top" align="center">4.44</td>
<td valign="top" align="center">0.54</td>
<td valign="top" align="center">6.40</td>
<td valign="top" align="center">4.83</td>
<td valign="top" align="center">0.49</td>
<td valign="top" align="center">4.49</td>
<td valign="top" align="center">3.31</td>
<td valign="top" align="center">0.75</td>
</tr>
<tr>
<td valign="top" align="center">Cal</td>
<td valign="top" align="center">6.82</td>
<td valign="top" align="center">4.96</td>
<td valign="top" align="center">0.42</td>
<td valign="top" align="center">6.72</td>
<td valign="top" align="center">5.07</td>
<td valign="top" align="center">0.44</td>
<td valign="top" align="center">5.89</td>
<td valign="top" align="center">4.39</td>
<td valign="top" align="center">0.59</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Val for the validation set, Cal for the test set. The bold font represents the optimal predicted values.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Presents the statistical results of yield prediction cross-validation based on side image parameters. <bold>(A&#x2013;C)</bold> represent the RMSE of combinations m1-m3 across five machine learning models. <bold>(D&#x2013;F)</bold> represent the MAE of combinations m1-m3 across five machine learning models. <bold>(G&#x2013;I)</bold> represent the R<sup>2</sup> of combinations m1-m3 across five machine learning models.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1395760-g006.tif"/>
</fig>
<p>
<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref> shows the statistical results of cross-validation for soybean yield prediction based on side-image parameters. It can be seen that m3 still performed the best overall, with the highest prediction accuracy for the GBDT model, followed by LightBoost. However, compared to the prediction results in <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>, the overall prediction accuracy improved.</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Yield prediction based on top-image parameters</title>
<p>The soybean yield was estimated using top-image parameters with a correlation greater than 0.5. The three combinations of input variables were named M1-M3; M1 consisted of morphological parameters (TPA1, TCA1, TRW, TRH, TCR, TRA, TCA2, TSC, and TCA3), M2 consisted of textural parameters (TGD, TE, TG, TGE1, TME, TDM, and TGH), and M3 consisted of a combination of morphological and textural parameters.</p>
<p>As shown in <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>, the R<sup>2</sup> value on the training set was generally greater than that on the test set, and the RMSE and MAE were generally lower than those on the test set. For M1, the GBDT and LightGBM models achieved the best prediction accuracy, with R<sup>2</sup> values of 0.71 each. RF had an R<sup>2</sup> value of 0.67, while CatBoost and MLP had the lowest prediction accuracies (R<sup>2</sup> &#x2264; 0.45). For M2, the overall prediction accuracy of the five models was greater than that for M1 (except for CatBoost). However, the GBDT and LightGBM models still achieved the highest prediction accuracies, each with an R<sup>2</sup> value of 0.76, while CatBoost and MLP had the lowest prediction accuracies (R<sup>2</sup> &#x2264; 0.40), with the highest errors. For M3, the combination of textural and morphological parameters did not significantly improve the prediction accuracy of the five models. According to <xref ref-type="fig" rid="f7">
<bold>Figures&#xa0;7A&#x2013;I</bold>
</xref>, the error order is m2 &gt; m1 &gt; m3, and the R<sup>2</sup> value order is m3 &gt; m2 &gt; m1. With an increase in the richness of the indicators, the prediction accuracy increased, and the error decreased. The textural parameters led to better performance than the morphological parameters in estimating yield. <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref> shows the statistical results of cross-validation for soybean yield prediction based on the top-image parameters. M3 still performed the best overall, with the highest prediction accuracy for the GBDT model. Overall, in predicting soybean yield based on the top-image parameters, the best predictive model was GBDT, which was consistent with the conclusion in Section 3.2.</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Prediction of yield based on top-image parameters.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" rowspan="2" colspan="2" align="center"/>
<th valign="top" colspan="3" align="center">m1</th>
<th valign="top" colspan="3" align="center">m2</th>
<th valign="top" colspan="3" align="center">m3</th>
</tr>
<tr>
<th valign="top" align="center">RMSE<break/>(%)</th>
<th valign="top" align="center">MAE<break/>(g/per)</th>
<th valign="top" align="center">R<sup>2</sup>
</th>
<th valign="top" align="center">RMSE<break/>(%)</th>
<th valign="top" align="center">MAE<break/>(g/per)</th>
<th valign="top" align="center">R<sup>2</sup>
</th>
<th valign="top" align="center">RMSE<break/>(%)</th>
<th valign="top" align="center">MAE<break/>(g/per)</th>
<th valign="top" align="center">R<sup>2</sup>
</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="2" align="center">CatBoost</td>
<td valign="bottom" align="center">Val</td>
<td valign="bottom" align="center">5.99</td>
<td valign="bottom" align="center">4.44</td>
<td valign="bottom" align="center">0.53</td>
<td valign="bottom" align="center">6.14</td>
<td valign="bottom" align="center">4.61</td>
<td valign="bottom" align="center">0.52</td>
<td valign="bottom" align="center">5.84</td>
<td valign="bottom" align="center">4.38</td>
<td valign="bottom" align="center">0.56</td>
</tr>
<tr>
<td valign="bottom" align="center">Cal</td>
<td valign="bottom" align="center">6.35</td>
<td valign="bottom" align="center">4.84</td>
<td valign="bottom" align="center">0.45</td>
<td valign="bottom" align="center">6.39</td>
<td valign="bottom" align="center">4.91</td>
<td valign="bottom" align="center">0.45</td>
<td valign="bottom" align="center">6.25</td>
<td valign="bottom" align="center">4.79</td>
<td valign="bottom" align="center">0.47</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">LightBoost</td>
<td valign="bottom" align="center">Val</td>
<td valign="bottom" align="center">1.88</td>
<td valign="bottom" align="center">1.47</td>
<td valign="bottom" align="center">0.89</td>
<td valign="bottom" align="center">2.12</td>
<td valign="bottom" align="center">1.68</td>
<td valign="bottom" align="center">0.89</td>
<td valign="bottom" align="center">1.63</td>
<td valign="bottom" align="center">1.27</td>
<td valign="bottom" align="center">0.91</td>
</tr>
<tr>
<td valign="bottom" align="center">Cal</td>
<td valign="bottom" align="center">4.38</td>
<td valign="bottom" align="center">2.85</td>
<td valign="bottom" align="center">0.71</td>
<td valign="bottom" align="center">3.29</td>
<td valign="bottom" align="center">2.75</td>
<td valign="bottom" align="center">0.75</td>
<td valign="bottom" align="center">4.05</td>
<td valign="bottom" align="center">2.61</td>
<td valign="bottom" align="center">0.75</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">GBDT</td>
<td valign="bottom" align="center">Val</td>
<td valign="bottom" align="center">1.88</td>
<td valign="bottom" align="center">1.47</td>
<td valign="bottom" align="center">0.87</td>
<td valign="bottom" align="center">2.12</td>
<td valign="bottom" align="center">1.68</td>
<td valign="bottom" align="center">0.89</td>
<td valign="bottom" align="center">1.63</td>
<td valign="bottom" align="center">1.27</td>
<td valign="bottom" align="center">0.90</td>
</tr>
<tr>
<td valign="bottom" align="center">Cal</td>
<td valign="bottom" align="center">4.38</td>
<td valign="bottom" align="center">2.85</td>
<td valign="bottom" align="center">0.71</td>
<td valign="bottom" align="center">3.83</td>
<td valign="bottom" align="center">2.74</td>
<td valign="bottom" align="center">
<bold>0.76</bold>
</td>
<td valign="bottom" align="center">4.05</td>
<td valign="bottom" align="center">2.61</td>
<td valign="bottom" align="center">0.75</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">RF</td>
<td valign="bottom" align="center">Val</td>
<td valign="bottom" align="center">0.60</td>
<td valign="bottom" align="center">1.90</td>
<td valign="bottom" align="center">0.89</td>
<td valign="bottom" align="center">0.56</td>
<td valign="bottom" align="center">2.12</td>
<td valign="bottom" align="center">0.9</td>
<td valign="bottom" align="center">0.66</td>
<td valign="bottom" align="center">1.74</td>
<td valign="bottom" align="center">0.90</td>
</tr>
<tr>
<td valign="bottom" align="center">Cal</td>
<td valign="bottom" align="center">0.49</td>
<td valign="bottom" align="center">4.43</td>
<td valign="bottom" align="center">0.67</td>
<td valign="bottom" align="center">0.58</td>
<td valign="bottom" align="center">3.21</td>
<td valign="bottom" align="center">0.70</td>
<td valign="bottom" align="center">0.71</td>
<td valign="bottom" align="center">3.06</td>
<td valign="bottom" align="center">0.67</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">MLP</td>
<td valign="bottom" align="center">Val</td>
<td valign="bottom" align="center">6.84</td>
<td valign="bottom" align="center">5.15</td>
<td valign="bottom" align="center">0.40</td>
<td valign="bottom" align="center">6.82</td>
<td valign="bottom" align="center">5.15</td>
<td valign="bottom" align="center">0.42</td>
<td valign="bottom" align="center">6.72</td>
<td valign="bottom" align="center">5.03</td>
<td valign="bottom" align="center">0.43</td>
</tr>
<tr>
<td valign="bottom" align="center">Cal</td>
<td valign="bottom" align="center">6.95</td>
<td valign="bottom" align="center">5.07</td>
<td valign="bottom" align="center">0.38</td>
<td valign="bottom" align="center">6.90</td>
<td valign="bottom" align="center">5.08</td>
<td valign="bottom" align="center">0.40</td>
<td valign="bottom" align="center">6.59</td>
<td valign="bottom" align="center">4.84</td>
<td valign="bottom" align="center">0.47</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Val for the validation set, Cal for the test set. The bold font represents the optimal predicted values.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Presents the statistical results of yield prediction cross-validation based on top image parameters. <bold>(A&#x2013;C)</bold> represent the RMSE of combinations M1-M3 across five machine learning models. <bold>(D&#x2013;F)</bold> represent the MAE of combinations M1-M3 across five machine learning models. <bold>(G&#x2013;I)</bold> represent the R<sup>2</sup> of combinations M1-M3 across five machine learning models.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1395760-g007.tif"/>
</fig>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Yield prediction based on side- and top-image parameters</title>
<p>Building on the results from the previous sections, the side- and top-image parameters were combined to estimate the soybean yield. The three combinations of input variables were named S1-S3: S1 (m1 + M1), S2 (m2 + M2), and S3 (m3 + M3). The prediction accuracies of the CatBoost, RF, and MLP models improved compared to those presented in the previous sections. Notably, the MLP model demonstrated the most significant improvement, with higher prediction accuracy as the input indicators became more diverse, reaching a maximum of 0.74. The GBDT model also exhibited improved prediction accuracy and reduced errors compared to those in the previous sections, with RMSE = 3.12 and MAE = 1.99 on the test set. Moreover, the GBDT model consistently performed well. According to <xref ref-type="fig" rid="f8">
<bold>Figures&#xa0;8A&#x2013;I</bold>
</xref>, the fusion of multiangle information contributed to reducing errors and enhancing the model prediction accuracy. In summary, the GBDT model is the optimal model for predicting soybean yield based on RGB image parameters. <xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8</bold>
</xref> shows the statistical results of cross-validation for soybean yield prediction based on the side- and top-image parameters. The fusion of multiangle information helps reduce errors and improve the model&#x2019;s prediction accuracy.</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>Presents the statistical results of yield prediction cross-validation based on top image parameters. <bold>(A-C)</bold> represent the RMSE of combinations S1-S3 across five machine learning models. <bold>(D&#x2013;F)</bold> represent the MAE of combinations S1-S3 across five machine learning models. <bold>(G&#x2013;I)</bold> represent the R<sup>2</sup> of combinations S1-S3 across five machine learning models.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1395760-g008.tif"/>
</fig>
</sec>
<sec id="s3_5">
<label>3.5</label>
<title>Importance of input parameters</title>
<p>Based on the results presented above, GBDT emerged as the best predictive model, achieving the highest R<sup>2</sup> value with the S3 combination while maintaining relatively low RMSE and MAE values. To further explore the contribution of each indicator and achieve high predictive accuracy with minimal input parameters, an analysis of the importance of each indicator with respect to the S3-GBDT combination was conducted.</p>
<p>As shown in <xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9</bold>
</xref>, the importance of the SME far exceeded that of the other indicators. This heightened importance could be attributed to its association with texture and photosynthesis (<xref ref-type="bibr" rid="B13">Heckmann et&#xa0;al., 2017</xref>). In addition to the SME, indicators such as SGD, SG, SDM, and TSC also exhibited considerable importance.</p>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>Importance of optimal input parameters.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1395760-g009.tif"/>
</fig>
</sec>
<sec id="s3_6">
<label>3.6</label>
<title>Selection of optimal input parameters</title>
<p>In the process of estimating crop yield based on remote sensing data, the selection of model variables is crucial (<xref ref-type="bibr" rid="B18">Ji et&#xa0;al., 2022</xref>). A comparison of the estimated soybean yield under the different numbers of input parameters (<xref ref-type="fig" rid="f10">
<bold>Figures&#xa0;10A&#x2013;C</bold>
</xref>) revealed that the RMSE, MAE, and R<sup>2</sup> values stabilized when the number of input parameters was equal to or greater than 15. To achieve high prediction accuracy with the most lightweight set of input parameters, we identified the 15 most common indicators (6 side textural indicators, 6 side morphological indicators, 1 top textural indicator, and 2 top morphological indicators) as the final selection of predictive parameters.</p>
<fig id="f10" position="float">
<label>Figure&#xa0;10</label>
<caption>
<p>RMSE, MAE, and R<sup>2</sup> values with different single seed weight input indices. <bold>(A)</bold> represent the RMSE. <bold>(B)</bold> represent the MAE. <bold>(C)</bold> represent the R<sup>2</sup>. The indicators are sequentially accumulated based on their importance. For instance, 1 item represents SME, 2 items represent SME + SGD, 3 items represent SME + SGD + SG, 4 items represent SME + SGD + SG + SDM, 5 items represent SME + SGD + SG + SDM + TSC, and so forth until all 39 indicators are included. The gray background indicates that, from the 15th item onward, the predictive performance of subsequent parameter combinations is comparable.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1395760-g010.tif"/>
</fig>
<p>Using these 15 indicators as input parameters for the five models, the prediction results are shown in <xref ref-type="fig" rid="f11">
<bold>Figure&#xa0;11</bold>
</xref>. The prediction accuracy significantly decreased in the MLP model, while the other four models showed no significant changes. In fact, the GBDT model exhibited a slight improvement in R<sup>2</sup> values. These results further emphasize that the effective selection of input indicators can greatly reduce the computational load while maintaining the prediction accuracy. Filtering out irrelevant information is advantageous for constructing a lightweight model.</p>
<fig id="f11" position="float">
<label>Figure&#xa0;11</label>
<caption>
<p>Predictive performance of the five models with 15 input indicators. <bold>(A)</bold> CatBoost model; <bold>(B)</bold> LightBoost model; <bold>(C)</bold> GBDT model; <bold>(D)</bold> RF model; and <bold>(E)</bold> MLP model. T_Yield represents the manually measured actual yield, and P_Yield represents the predicted value. The black dashed line represents a 1:1 relationship, where red indicates the training set and blue indicates the test set.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1395760-g011.tif"/>
</fig>
<p>According to <xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref>, the broad-sense heritability of the 15 input parameters ranges from 0.68 to 0.84, with SME and SRA exhibiting the highest broad-sense heritability.</p>
<table-wrap id="T4" position="float">
<label>Table&#xa0;4</label>
<caption>
<p>The broad-sense heritability of the 15 input indicators.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="bottom" align="center">Indicators</th>
<th valign="middle" align="center">TRH</th>
<th valign="middle" align="center">TSC</th>
<th valign="middle" align="center">TG</th>
<th valign="middle" align="center">2_5_MW</th>
<th valign="middle" align="center">3_5_MW</th>
<th valign="middle" align="center">4_5_MW</th>
<th valign="middle" align="center">SRA</th>
<th valign="middle" align="center">SSC</th>
<th valign="middle" align="center">SPA2</th>
<th valign="middle" align="center">SGD</th>
<th valign="middle" align="center">SE</th>
<th valign="middle" align="center">SG</th>
<th valign="middle" align="center">SGE1</th>
<th valign="middle" align="center">SME</th>
<th valign="middle" align="center">SDM</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="bottom" align="center">
<italic>H<sup>2</sup>
</italic>
</td>
<td valign="middle" align="center">0.81</td>
<td valign="middle" align="center">0.80</td>
<td valign="middle" align="center">0.68</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.80</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.84</td>
<td valign="middle" align="center">0.78</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center">0.70</td>
<td valign="middle" align="center">0.78</td>
<td valign="middle" align="center">0.68</td>
<td valign="middle" align="center">0.84</td>
<td valign="middle" align="center">0.73</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<sec id="s4_1">
<label>4.1</label>
<title>Extraction of image parameters</title>
<p>There has been extensive research on the use of RGB cameras to extract image parameters for predicting crop yields. However, previous studies have often had relatively narrow shooting angles, mostly capturing images from the top, leading to significant information loss. Moreover, in previous research, the focus was primarily on morphological indicators (<xref ref-type="bibr" rid="B25">Ma et&#xa0;al., 2022</xref>). reported a significant correlation between vegetation indices extracted from RGB images and cotton yield, suggesting that selecting optimal parameter features for cotton yield monitoring is feasible. However, from the perspective of model accuracy, there is room for improvement. Therefore, there is a need to extract more textural features or other color information from RGB images to enhance the model accuracy. Research by (<xref ref-type="bibr" rid="B2">Bai et&#xa0;al., 2022</xref>) also demonstrated that textural information has high potential for yield estimation. Building on previous studies, in this study, not only were the shooting angles expanded from the top and side, but three major categories of image parameters were also extracted&#x2014;morphology, color, and textural parameters. This approach significantly enriched the variety of image parameters, providing a broader selection for identifying the optimal image indicators in subsequent analyses.</p>
</sec>
<sec id="s4_2">
<label>4.2</label>
<title>Discussion on optimal input parameters</title>
<p>Indicator selection is a crucial step in machine learning. While algorithms determine the lower bounds of a model, input indicators set the upper bounds (<xref ref-type="bibr" rid="B25">Ma et&#xa0;al., 2022</xref>). The inclusion of a large amount of irrelevant input information can adversely affect model training, thereby impacting model accuracy. Therefore, a correlation analysis was initially conducted between all images and soybean yields, and only indicators with a Pearson correlation coefficient greater than 0.5 were obtained. This preliminary screening filtered out a significant amount of ineffective information.</p>
<p>After identifying GBDT as the optimal predictive model, further efforts were made to streamline the input indicators. Based on their importance, indicators were incrementally added to the model. As shown in <xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10</bold>
</xref>, using 15 important parameters as input led to the desired results. With an increase in the input parameters, the RMSE, MAE, and R<sup>2</sup> values no longer exhibited significant changes, which might be due to the substantial collinearity among the input parameters, as the information coverage did not significantly improve with additional input indicators. Early analysis of input variables to reduce autocorrelation effects appears to have positive effects on model prediction (<xref ref-type="bibr" rid="B12">Han et&#xa0;al., 2019</xref>).</p>
<p>Moreover, an in-depth analysis of the final selection of 15 indicators, as shown in <xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9</bold>
</xref>, revealed that the importance of SMEs was the highest, exceeding 30%. Previous research has indicated an association between textural parameters and plant photosynthesis (<xref ref-type="bibr" rid="B13">Heckmann et&#xa0;al., 2017</xref>). Our experimental design included two planting modes, soybean monoculture and strip intercropping, which magnified the impact of light conditions on soybean yield. Consequently, the importance of textural parameters became more prominent, further confirming our hypothesis. Additionally, the number of selected sideview image indicators far exceeded that of the top-view indicators. This dataset included 12 sideview image indicators (6 textural indicators and 6 morphological indicators) and 3 top-view image indicators (1 textural indicator and 2 morphological indicators). From <xref ref-type="table" rid="T1">
<bold>Tables&#xa0;1</bold>
</xref> and <xref ref-type="table" rid="T2">
<bold>2</bold>
</xref>, it is evident that predictions based on sideview images were better than those based on top-view images, and the selected indicators explain this predictive performance.</p>
</sec>
<sec id="s4_3">
<label>4.3</label>
<title>Discussion on the performance of the five models</title>
<p>As a branch of artificial intelligence, machine learning technology has found widespread application due to its remarkable ability to integrate complex and dynamic biological knowledge with large-scale omics data (<xref ref-type="bibr" rid="B30">Shahhosseini et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B33">Van Klompenburg et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B27">Paudel et&#xa0;al., 2021</xref>). Machine learning technologies enable the construction of various prediction models and decision algorithms (<xref ref-type="bibr" rid="B36">Yan and Wang, 2022</xref>). As evident from <xref ref-type="table" rid="T2">
<bold>Tables&#xa0;2</bold>
</xref>, <xref ref-type="table" rid="T3">
<bold>3</bold>
</xref>, and <xref ref-type="table" rid="T5">
<bold>5</bold>
</xref>, the GBDT model achieved superior predictive accuracy compared to that of the other four models, consistently exhibiting the same pattern in terms of prediction errors. Therefore, the GBDT model is the optimal model for soybean yield estimation. The inherent advantage of GBDT, which is composed of numerous decision trees, lies in its continuous feature selection and partitioning process, which enhances its fitting capacity to the data (<xref ref-type="bibr" rid="B38">Zhang et&#xa0;al., 2023</xref>). GBDT achieves sample data classification by progressively reducing the residuals generated during the training process, significantly improving the data-fitting capabilities (<xref ref-type="bibr" rid="B38">Zhang et&#xa0;al., 2023</xref>).</p>
<table-wrap id="T5" position="float">
<label>Table&#xa0;5</label>
<caption>
<p>Prediction of yield based on side- and top-image parameters.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" rowspan="2" colspan="2" align="center"/>
<th valign="top" colspan="3" align="center">S1</th>
<th valign="top" colspan="3" align="center">S2</th>
<th valign="top" colspan="3" align="center">S3</th>
</tr>
<tr>
<th valign="top" align="center">RMSE<break/>(%)</th>
<th valign="top" align="center">MAE<break/>(g/per)</th>
<th valign="top" align="center">R<sup>2</sup>
</th>
<th valign="top" align="center">RMSE<break/>(%)</th>
<th valign="top" align="center">MAE<break/>(g/per)</th>
<th valign="top" align="center">R<sup>2</sup>
</th>
<th valign="top" align="center">RMSE<break/>(%)</th>
<th valign="top" align="center">MAE<break/>(g/per)</th>
<th valign="top" align="center">R<sup>2</sup>
</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="2" align="center">CatBoost</td>
<td valign="bottom" align="center">Val</td>
<td valign="bottom" align="center">5.00</td>
<td valign="bottom" align="center">3.80</td>
<td valign="bottom" align="center">0.69</td>
<td valign="bottom" align="center">5.34</td>
<td valign="bottom" align="center">4.10</td>
<td valign="bottom" align="center">0.65</td>
<td valign="bottom" align="center">4.75</td>
<td valign="bottom" align="center">3.66</td>
<td valign="bottom" align="center">0.75</td>
</tr>
<tr>
<td valign="bottom" align="center">Cal</td>
<td valign="bottom" align="center">5.89</td>
<td valign="bottom" align="center">4.43</td>
<td valign="bottom" align="center">0.55</td>
<td valign="bottom" align="center">5.91</td>
<td valign="bottom" align="center">0.49</td>
<td valign="bottom" align="center">0.54</td>
<td valign="bottom" align="center">0.69</td>
<td valign="bottom" align="center">4.26</td>
<td valign="bottom" align="center">0.61</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">LightBoost</td>
<td valign="bottom" align="center">Val</td>
<td valign="bottom" align="center">1.25</td>
<td valign="bottom" align="center">0.86</td>
<td valign="bottom" align="center">0.95</td>
<td valign="bottom" align="center">1.86</td>
<td valign="bottom" align="center">1.30</td>
<td valign="bottom" align="center">0.92</td>
<td valign="bottom" align="center">0.98</td>
<td valign="bottom" align="center">0.65</td>
<td valign="bottom" align="center">0.99</td>
</tr>
<tr>
<td valign="bottom" align="center">Cal</td>
<td valign="bottom" align="center">4.17</td>
<td valign="bottom" align="center">2.52</td>
<td valign="bottom" align="center">0.77</td>
<td valign="bottom" align="center">4.46</td>
<td valign="bottom" align="center">2.90</td>
<td valign="bottom" align="center">0.73</td>
<td valign="bottom" align="center">4.26</td>
<td valign="bottom" align="center">2.26</td>
<td valign="bottom" align="center">0.79</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">GBDT</td>
<td valign="bottom" align="center">Val</td>
<td valign="bottom" align="center">1.20</td>
<td valign="bottom" align="center">0.92</td>
<td valign="bottom" align="center">0.93</td>
<td valign="bottom" align="center">1.32</td>
<td valign="bottom" align="center">1.20</td>
<td valign="bottom" align="center">0.91</td>
<td valign="bottom" align="center">0.92</td>
<td valign="bottom" align="center">0.72</td>
<td valign="bottom" align="center">0.97</td>
</tr>
<tr>
<td valign="bottom" align="center">Cal</td>
<td valign="bottom" align="center">3.01</td>
<td valign="bottom" align="center">2.11</td>
<td valign="bottom" align="center">0.8</td>
<td valign="bottom" align="center">2.88</td>
<td valign="bottom" align="center">2.04</td>
<td valign="bottom" align="center">0.78</td>
<td valign="bottom" align="center">3.12</td>
<td valign="bottom" align="center">1.99</td>
<td valign="bottom" align="center">
<bold>0.82</bold>
</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">RF</td>
<td valign="bottom" align="center">Val</td>
<td valign="bottom" align="center">0.71</td>
<td valign="bottom" align="center">1.28</td>
<td valign="bottom" align="center">0.94</td>
<td valign="bottom" align="center">0.69</td>
<td valign="bottom" align="center">1.78</td>
<td valign="bottom" align="center">0.93</td>
<td valign="bottom" align="center">0.79</td>
<td valign="bottom" align="center">1.21</td>
<td valign="bottom" align="center">0.97</td>
</tr>
<tr>
<td valign="bottom" align="center">Cal</td>
<td valign="bottom" align="center">0.60</td>
<td valign="bottom" align="center">4.11</td>
<td valign="bottom" align="center">0.75</td>
<td valign="bottom" align="center">0.55</td>
<td valign="bottom" align="center">4.51</td>
<td valign="bottom" align="center">0.74</td>
<td valign="bottom" align="center">0.65</td>
<td valign="bottom" align="center">4.25</td>
<td valign="bottom" align="center">0.79</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">MLP</td>
<td valign="bottom" align="center">Val</td>
<td valign="bottom" align="center">5.00</td>
<td valign="bottom" align="center">3.80</td>
<td valign="bottom" align="center">0.69</td>
<td valign="bottom" align="center">6.02</td>
<td valign="bottom" align="center">4.64</td>
<td valign="bottom" align="center">0.55</td>
<td valign="bottom" align="center">3.42</td>
<td valign="bottom" align="center">2.59</td>
<td valign="bottom" align="center">0.87</td>
</tr>
<tr>
<td valign="bottom" align="center">Cal</td>
<td valign="bottom" align="center">5.89</td>
<td valign="bottom" align="center">4.43</td>
<td valign="bottom" align="center">0.55</td>
<td valign="bottom" align="center">5.75</td>
<td valign="bottom" align="center">4.37</td>
<td valign="bottom" align="center">0.59</td>
<td valign="bottom" align="center">4.84</td>
<td valign="bottom" align="center">3.55</td>
<td valign="bottom" align="center">0.74</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Val for the validation set, Cal for the test set. The bold font represents the optimal predicted values.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>The overall prediction performance of the MLP model is relatively poor. This is attributed to the model&#x2019;s network structure, which includes multiple hidden layers, and each &#x201c;neuron&#x201d; is connected to all nodes in the preceding layer. This structure results in many parameters, making training challenging. However, with sufficient computational power and training data, the MLP performance can be significantly enhanced. This finding aligns with the results of our study, where an increase in the input parameters led to a noticeable improvement in the MLP prediction performance, reaching a maximum R<sup>2</sup> value of 0.74.</p>
<p>In this study, there are likely two reasons for the low predictive accuracy of the CatBoost model. First, due to the soybeans being grown in the field and influenced by field conditions, the growth status of each soybean plant is not very standardized (it may tilt, bend, break at the top, etc.; see <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S2</bold>
</xref>), leading to many outliers. Although this study used the outlier test function in the car package to remove outliers, there is still a possibility of incomplete removal, which affects the predictive accuracy of the CatBoost model. Second, this study referred to the methods of predecessors and conducted preliminary screening of input parameters using absolute correlation (<xref ref-type="bibr" rid="B37">Yu and Liu, 2003</xref>; <xref ref-type="bibr" rid="B9">Cui et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B25">Ma et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B22">Li et&#xa0;al., 2023</xref>). However, it is possible that setting the screening threshold too low (Cor &gt; 0.5) retained some indicators with weaker relationships, which had a certain impact on the predictive accuracy of the model. Therefore, in future research, more screening criteria should be added on the basis of correlations to enhance the initial screening of indicators. In the context of machine learning, heritability may not be a direct factor influencing algorithm selection, but it does affect the nature of the data and the structure of the feature space, thereby indirectly influencing the selection and performance of machine learning algorithms. In this study, the broad-sense heritability of soybean yield was 0.621. Therefore, when selecting machine learning algorithms, features with complex genetic mechanisms may have more diverse and nonlinear distributions. Algorithms capable of handling nonlinear relationships and complex patterns, such as support vector machines or decision trees, may be more suitable.</p>
<p>In general, as the richness of the indicators increases, the prediction accuracy improves, and the errors decrease. When using single-angle indicators as the input parameters, sideview indicators lead to significantly better performance than top-view indicators. When single-type indicators are used as the input parameters, the morphological parameters lead to better performance than the textural parameters from the sideview, while the textural parameters lead to better performance than the morphological parameters from the top view. We speculate that this phenomenon is due to the abundance of effective morphological parameters extracted from sideview images, whereas the top view provides a more intuitive view of young and tender soybean leaves. Therefore, sideview morphological parameters and top-view textural parameters are more critical for estimating soybean single-plant yield.</p>
</sec>
<sec id="s4_4">
<label>4.4</label>
<title>Future directions</title>
<p>In this study, five machine learning algorithms were employed to estimate soybean yield. The results indicate that RGB images can be used to accurately estimate soybean yield. This research contributes to the identification of a high-throughput and nondestructive method for estimating soybean yield, accelerating the screening of germplasm and breeding materials.</p>
<p>Despite extracting as many indicators as possible in this study to estimate the final yield parameters, the information inherently contained in RGB images is limited, leaving room for further improvement in terms of the estimation accuracy. However, this study, which was based on data from 240 soybean varieties, two treatments, and two years of field data, benefitted from a large dataset, making our conclusions more applicable to real-world scenarios and highly credible. Future research could consider adding sensor types and enriching phenotypic parameters, thereby enhancing the prediction accuracy and reducing errors. Additionally, due to limited throughput and substantial workload, only images from the R6 stage were collected for analysis in this study. Subsequent research could involve image collection throughout the entire growth period to determine the earliest stage for accurate soybean yield estimation, further shortening the breeding process.</p>
<p>Finally, it is worth noting that selecting the best predictive model requires considering multiple factors comprehensively. Key factors include data characteristics such as scale, number and type of features, distribution, problem nature such as regression or classification, order or unordering, model characteristics such as interpretability, training speed, overfitting and underfitting, and resource constraints such as computation and time. For example, when dealing with many features, tree-based algorithms (such as GBDT and RF) may perform well because they can effectively handle high-dimensional data. For features with complex relationships, neural networks may be more effective. For regression problems, linear regression, decision tree regression, or GBDT may be good choices; for classification problems, logistic regression, support vector machine (SVM), RF, or deep neural networks may be more suitable. Additionally, it is important to evaluate model performance and select appropriate metrics through cross-validation. Therefore, there is no universally best model, and it is necessary to try multiple models and optimize them based on specific circumstances.</p>
</sec>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusions</title>
<p>This study concludes with two main findings: (1) The optimal input parameters were determined to be SME, SGD, SG, SDM, TSC, SPA2, SGE1, SSC, 4/5MW, TG, SRRA, SE, 3/5MW, TRH, and 2/5MW, totaling 15 indicators. (2) Among the five machine learning models, GBDT emerged as the best model for predicting soybean yield, achieving a maximum accuracy of 0.82. Therefore, this combination of parameters extracted from RGB images and machine learning has significant potential for estimating soybean yield parameters.</p>
</sec>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>XL: Conceptualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing, Data curation, Visualization. MC: Data curation, Writing &#x2013; original draft. SH: Conceptualization, Writing &#x2013; review &amp; editing. XX: Visualization, Writing &#x2013; original draft. LH: Validation, Writing &#x2013; review &amp; editing. LW: Validation, Writing &#x2013; review &amp; editing. YG: Software, Writing &#x2013; review &amp; editing. FT: Software, Writing &#x2013; review &amp; editing. TG: Software, Writing &#x2013; review &amp; editing. WW: Supervision, Writing &#x2013; review &amp; editing. MX: Supervision, Writing &#x2013; review &amp; editing. CL: Supervision, Writing &#x2013; review &amp; editing. LY: Resources, Writing &#x2013; review &amp; editing. WL: Funding acquisition, Writing &#x2013; review &amp; editing. WY: Writing &#x2013; review &amp; editing, Resources.</p>
</sec>
</body>
<back>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article. This work was supported by the Molecular mechanism of relay intercropping light environment regulating shade-tolerant plant architecture formation in soybean (32172122), the Major Project on Agricultural Biotechnology Breeding under the Technology Innovation 2030 Initiative (2022ZD04007), the Key Research and Development Project of the Guizhou Branch of China National Tobacco Corporation (2023XM18), the National Modern Agricultural Industry Technology System, Sichuan Bean Miscellaneous Grain Innovation Team, soybean germplasm resource collection and evaluation post expert (SC-CXTD-2020-20).</p>
</sec>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2024.1395760/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2024.1395760/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Presentation_1.zip" id="SF1" mimetype="application/zip"/>
<supplementary-material xlink:href="DataSheet_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Aghelpour</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Varshavian</surname> <given-names>V.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Forecasting different types of droughts simultaneously using multivariate standardized precipitation index (MSPI), MLP neural network, and imperialistic competitive algorithm (ICA)</article-title>. <source>Complexity</source> <volume>2021</volume>, <fpage>1</fpage>&#x2013;<lpage>16</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1155/2021/6610228</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bai</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Shao</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>B.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Estimation of soybean yield parameters under lodging conditions using rgb information from unmanned aerial vehicles</article-title>. <source>Front. Plant Sci.</source> <volume>13)</volume>, <elocation-id>1012293</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2022.1012293</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bharati</surname> <given-names>M. H.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>J.J.</given-names>
</name>
<name>
<surname>MacGregor</surname> <given-names>J. F.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Image texture analysis: methods and comparisons</article-title>. <source>Chemometrics intelligent Lab. Syst.</source> <volume>72</volume>, <fpage>57</fpage>&#x2013;<lpage>71</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.chemolab.2004.02.005</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2001</year>). <source>Random forests[J]. Machine learning</source>. <volume>45</volume>, <fpage>5</fpage>&#x2013;<lpage>32</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brinkhoff</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Dunn</surname> <given-names>B. W.</given-names>
</name>
<name>
<surname>Dunn</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>The influence of nitrogen and variety on rice grain moisture content dry-down</article-title>. <source>Field Crops Res.</source> <volume>302</volume>, <fpage>109044</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.fcr.2023.109044</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cao</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Niyogi</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Improving the forecasting of winter wheat yields in northern China with machine learning&#x2013;dynamical hybrid subseasonal-to-seasonal ensemble prediction</article-title>. <source>Remote Sens.</source> <volume>14</volume>, <fpage>1</fpage>&#x2013;<lpage>17</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs14071707</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cheng</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Penuelas</surname> <given-names>J.</given-names>
</name>
<name>
<surname>McCabe</surname> <given-names>M. F.</given-names>
</name>
<name>
<surname>Atzberger</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Jiao</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>W.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Combining multi-indicators with machine-learning algorithms for maize yield early prediction at the county-level in China</article-title>. <source>Agric. For. Meteorology</source> <volume>323</volume>, <fpage>109057</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.agrformet.2022.109057</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chiozza</surname> <given-names>M. V.</given-names>
</name>
<name>
<surname>Parmley</surname> <given-names>K. A.</given-names>
</name>
<name>
<surname>Higgins</surname> <given-names>R. H.</given-names>
</name>
<name>
<surname>Singh</surname> <given-names>A. K.</given-names>
</name>
<name>
<surname>Miguez</surname> <given-names>F. E.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Comparative prediction accuracy of hyperspectral bands for different soybean crop variables: From leaf area to seed composition</article-title>. <source>Field Crops Res.</source> <volume>271)</volume>, <fpage>108260</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.fcr.2021.108260</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Cui</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>J. S.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>Q</given-names>
</name>
</person-group> (<year>2010</year>). <conf-name>Correlation-based feature selection and regression[C]//Pacific-Rim Conference on Multimedia</conf-name>. <conf-loc>Springer-Verlag</conf-loc>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-3-642-15702-8_3</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feng</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Du</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Luck</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Alfalfa yield prediction using UAV-based hyperspectral imagery and ensemble learning</article-title>. <source>Remote Sens.</source> <volume>12</volume>, <fpage>2028</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs12122028</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gilliot</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Michelin</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Hadjard</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Houot</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>An accurate method for predicting spatial variability of maize yield from UAV-based plant height estimation: a tool for monitoring agronomic field experiments</article-title>. <source>Precis. Agric.</source> <volume>6</volume>, <fpage>1</fpage>&#x2013;<lpage>25</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11119-020-09764-w</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Han</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Dai</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>B</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>H.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Modeling maize above-ground biomass based on machine learning approaches using UAV remote-sensing data</article-title>. <source>Plant Methods</source> <volume>15</volume>, <fpage>1</fpage>&#x2013;<lpage>19</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13007-019-0394-z</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Heckmann</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Schl&#xfc;ter</surname> <given-names>U.</given-names>
</name>
<name>
<surname>Weber</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Machine learning techniques for predicting crop photosynthetic capacity from leaf reflectance spectra</article-title>. <source>Mol. Plant</source> <volume>10</volume>, <fpage>878</fpage>&#x2013;<lpage>890</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.molp.2017.04.009</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hong</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>1984</year>). <article-title>Texture analysis method of grayscale-gradient symbiosis matrix</article-title>. <source>Acta Automatica Sin.</source> <volume>01</volume>, <fpage>22</fpage>&#x2013;<lpage>25</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.16383/j.aas.1984.01.005</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Qiao</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Ji</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Experimental study of airborne thermal infrared camera applied to agricultural drought monitoring</article-title>. <source>J. Capital Normal University: Natural Sci. Edition</source> <volume>38</volume>, <fpage>1</fpage>&#x2013;<lpage>8</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.19789/j.1004-9398.2017.03.016</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Huang</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2020</year>). <source>FPGA implementation of ECG identity recognition algorithm based on convolutional neural network</source> (<publisher-name>Jilin University</publisher-name>).</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hughes</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Askew</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Scotson</surname> <given-names>C. P.</given-names>
</name>
<name>
<surname>Williams</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Sauze</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Corke</surname> <given-names>F.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Non-destructive, high-content analysis of wheat grain traits using X-ray micro computed tomography</article-title>. <source>Plant Methods</source> <volume>13</volume>, <fpage>1</fpage>&#x2013;<lpage>16</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13007-017-0229-8</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ji</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Cheng</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Yan</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Estimation of plant height and yield based on UAV imagery in faba bean (Vicia faba L)</article-title>. <source>Plant Methods</source> <volume>18</volume>, <fpage>26</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13007-022-00861-7</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jin</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Winter wheat yield estimation based on multi-source medium resolution optical and radar imaging data and the AquaCrop model using the particle swarm optimization algorithm</article-title>. <source>Isprs J. Photogrammetry Remote Sens.</source> <volume>126</volume>, <fpage>24</fpage>&#x2013;<lpage>37</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.isprsjprs.2017.02.001</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khalifani</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Darvishzadeh</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Azad</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Rahmani</surname> <given-names>R. S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Prediction of sunflower grain yield under normal and salinity stress by RBF, MLP and, CNN models</article-title>. <source>Ind. Crops Products</source> <volume>189)</volume>, <fpage>115762</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.indcrop.2022.115762</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>He</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Crop yield forecasting and associated optimum lead time analysis based on multi-source environmental data across China</article-title>. <source>Agric. For. Meteorology</source> <volume>308</volume>, <fpage>108558</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.agrformet.2021.108558</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Xiang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>M.</given-names>
</name>
<name>
<surname>He</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>W.</given-names>
</name>
<etal/>
</person-group>. (<year>2023</year>). <article-title>Soybean leaf estimation based on RGB images and machine learning methods</article-title>. <source>Plant Methods</source> <volume>19</volume>, <fpage>59</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13007-023-01023-z</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>F.</given-names>
</name>
</person-group> (<year>2020</year>). <source>Root cause localization application of abnormal faults based on CatBoost model</source> (<publisher-name>Lanzhou University</publisher-name>).</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lu</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Xue</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Xiao</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Improved estimation of coalbed methane content using the revised estimate of depth and CatBoost algorithm: A case study from southern Sichuan Basin, China</article-title>. <source>Comput. Geosciences</source> <volume>158)</volume>, <fpage>1</fpage>&#x2013;<lpage>12</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cageo.2021.104973</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ma</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Yi</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Cotton yield estimation based on vegetation indices and texture features derived from RGB image</article-title>. <source>Front. Plant Sci.</source> <volume>13)</volume>, <elocation-id>925986</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2022.925986</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Paswan</surname> <given-names>R. P.</given-names>
</name>
<name>
<surname>Begum</surname> <given-names>S. A.</given-names>
</name>
</person-group> (<year>2013</year>). &#x201c;<article-title>MLP for prediction of area and rice production of upper Brahmaputra Valley zone of Assam</article-title>,&#x201d; in <conf-name>2013 Fourth International Conference on Computing, Communications and Networking Technologies (ICCCNT)</conf-name>. <fpage>1</fpage>&#x2013;<lpage>9</lpage> (<publisher-name>IEEE</publisher-name>).</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Paudel</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Boogaard</surname> <given-names>H.</given-names>
</name>
<name>
<surname>de Wit</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Janssen</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Osinga</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Pylianidis</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Machine learning for large-scale crop yield forecasting</article-title>. <source>Agric. Syst.</source> <volume>187)</volume>, <fpage>103016</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.agsy.2020.103016</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ren</surname> <given-names>T.-H.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z.-Y.</given-names>
</name>
<name>
<surname>Du</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>X.-H.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>D.-P.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Improving photosynthetic performance and yield of summer soybean by organic fertilizer application and increasing plant density</article-title>. <source>J. Plant Nutr. Fertilizers</source> <volume>27</volume>, <fpage>1361</fpage>&#x2013;<lpage>1375</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.11674/zwyf.2021010"10.11674/zwyf.2021010</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Seireg</surname> <given-names>H. R.</given-names>
</name>
<name>
<surname>Omar</surname> <given-names>Y. M.</given-names>
</name>
<name>
<surname>El-Sayed</surname> <given-names>F.</given-names>
</name>
<name>
<surname>El-Fishawy</surname> <given-names>A. S.</given-names>
</name>
<name>
<surname>Elmahalawy</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Cascading ensemble machine learning algorithms for maize yield level prediction</article-title>. <source>Menoufia J. Electronic Eng. Res.</source> <volume>32</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.21608/mjeer.2023.159995.1066</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shahhosseini</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Archontoulis</surname> <given-names>S. V.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Forecasting corn yield with machine learning ensembles</article-title>. <source>Front. Plant Sci.</source> <volume>11)</volume>, <elocation-id>527890</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2020.01120</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Shi</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Gradient boosting with piece-wise linear regression trees</article-title>. <source>[J]. arXiv preprint arXiv</source>. <page-range>1802.05640</page-range>. doi:&#xa0;<pub-id pub-id-type="doi">10.48550/arXiv.1802.05640</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Prediction of end-of-season tuber yield and tuber set in potatoes using in-season UAV-based hyperspectral imagery and machine learning</article-title>. <source>Sensors</source> <volume>20</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/s20185293</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Van Klompenburg</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Kassahun</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Catal</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Crop yield prediction using machine learning: A systematic literature review</article-title>. <source>Comput. Electron. Agric.</source> <volume>177)</volume>, <elocation-id>105709</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2020.105709</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Shang</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>UAV- and machine learning-based retrieval of wheat SPAD values at the overwintering stage for variety screening</article-title>. <source>Remote Sens.</source> <volume>5166</volume>, <fpage>1</fpage>&#x2013;<lpage>20</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs13245166</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yamaguchi</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Tanaka</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Imachi</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Yamashita</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Katsura</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Feasibility of combining deep learning and RGB images obtained by unmanned aerial vehicle for leaf area index estimation in rice</article-title>. <source>Remote Sens.</source> <volume>13</volume>, <fpage>84</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs13010084</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Machine learning bridges omics sciences and plant breeding</article-title>. <source>Trends Plant Sci.</source> <volume>23</volume>, <fpage>1</fpage>&#x2013;<lpage>12</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.tplants.2022.08.018</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Yu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Feature Selection for High-Dimensional Data: A Fast Correlation-Based Filter Solution[J]. Springer Publishing Company, Incorporated</article-title>, doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-3-319-21858-8</pub-id>.</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>H.-Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>Z.-Z.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>J.-M.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>M.-Z.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>K.-D.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Extraction of planting structure of winter wheat using GBDT and google earth engine</article-title>. <source>Spectrosc. And Spectral Anal.</source> <volume>43</volume>, <fpage>597</fpage>&#x2013;<lpage>607</lpage>.</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>X.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Research progress on soybean leaf development</article-title>. <source>Seed Technol.</source> <volume>39</volume>, <fpage>13</fpage>&#x2013;<lpage>14</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.19904/j.cnki.cn14-1160/s.2021.18.004</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>