<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2023.1103276</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Unstructured road extraction and roadside fruit recognition in grape orchards based on a synchronous detection algorithm</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Zhou</surname>
<given-names>Xinzhao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2087599"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zou</surname>
<given-names>Xiangjun</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2158137"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tang</surname>
<given-names>Wei</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2146132"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yan</surname>
<given-names>Zhiwei</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Meng</surname>
<given-names>Hewei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Luo</surname>
<given-names>Xiwen</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>College of Mechanical and Electrical Engineering, Shihezi University</institution>, <addr-line>Shihezi</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Foshan-Zhongke Innovation Research Institute of Intelligent Agriculture</institution>, <addr-line>Foshan</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Foshan Sino-tech Industrial Technology Research Institute</institution>, <addr-line>Foshan</addr-line>, <country>China</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>College of Engineering, South China Agricultural University</institution>, <addr-line>Guangzhou</addr-line>, <country>China</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Guangdong Provincial Key Laboratory of Agricultural Artificial Intelligence (GDKL-AAI)</institution>, <addr-line>Guangzhou</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Long He, The Pennsylvania State University (PSU), United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Uzair Aslam Bhatti, Hainan University, China; Kai Huang, Jiangsu Academy of Agricultural Sciences, China; Itsuki Kunita, University of the Ryukyus, Japan</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Hewei Meng, <email xlink:href="mailto:mhw_mac@126.com">mhw_mac@126.com</email>; Xiwen Luo, <email xlink:href="mailto:xwluo@scau.edu.cn">xwluo@scau.edu.cn</email>
</p>
</fn>
<fn fn-type="equal" id="fn003">
<p>&#x2020;These authors have contributed equally to this work</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>02</day>
<month>06</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>14</volume>
<elocation-id>1103276</elocation-id>
<history>
<date date-type="received">
<day>20</day>
<month>11</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>08</day>
<month>05</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Zhou, Zou, Tang, Yan, Meng and Luo</copyright-statement>    <copyright-year>2023</copyright-year>
<copyright-holder>Zhou, Zou, Tang, Yan, Meng and Luo</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Accurate road extraction and recognition of roadside fruit in complex orchard environments are essential prerequisites for robotic fruit picking and walking behavioral decisions. In this study, a novel algorithm was proposed for unstructured road extraction and roadside fruit synchronous recognition, with wine grapes and nonstructural orchards as research objects. Initially, a preprocessing method tailored to field orchards was proposed to reduce the interference of adverse factors in the operating environment. The preprocessing method contained 4 parts: interception of regions of interest, bilateral filter, logarithmic space transformation and image enhancement based on the MSRCR algorithm. Subsequently, the analysis of the enhanced image enabled the optimization of the gray factor, and a road region extraction method based on dual-space fusion was proposed by color channel enhancement and gray factor optimization. Furthermore, the YOLO model suitable for grape cluster recognition in the wild environment was selected, and its parameters were optimized to enhance the recognition performance of the model for randomly distributed grapes. Finally, a fusion recognition framework was innovatively established, wherein the road extraction result was taken as input, and the optimized parameter YOLO model was utilized to identify roadside fruits, thus realizing synchronous road extraction and roadside fruit detection. Experimental results demonstrated that the proposed method based on the pretreatment could reduce the impact of interfering factors in complex orchard environments and enhance the quality of road extraction. Using the optimized YOLOv7 model, the precision, recall, mAP, and F1-score for roadside fruit cluster detection were 88.9%, 89.7%, 93.4%, and 89.3%, respectively, all of which were higher than those of the YOLOv5 model and were more suitable for roadside grape recognition. Compared to the identification results obtained by the grape detection algorithm alone, the proposed synchronous algorithm increased the number of fruit identifications by 23.84% and the detection speed by 14.33%. This research enhanced the perception ability of robots and provided a solid support for behavioral decision systems.</p>
</abstract>
<kwd-group>
<kwd>non-structural environment</kwd>
<kwd>machine vision</kwd>
<kwd>fruit harvesting robot</kwd>
<kwd>deep learning</kwd>
<kwd>roadside fruits detection</kwd>
</kwd-group>    <contract-num rid="cn001">2022DB004</contract-num>    <contract-num rid="cn002">2120001008424</contract-num>    <contract-num rid="cn003">2022A1515140162, 2022A1515140013</contract-num>    <contract-sponsor id="cn001">Science and Technology Bureau of Xinjiang Production and Construction Corps<named-content content-type="fundref-id">10.13039/501100021193</named-content>
</contract-sponsor>    <contract-sponsor id="cn002">Foshan Science and Technology Bureau<named-content content-type="fundref-id">10.13039/501100011478</named-content>
</contract-sponsor>    <contract-sponsor id="cn003">Guangdong Science and Technology Department<named-content content-type="fundref-id">10.13039/501100007162</named-content>
</contract-sponsor>
<counts>
<fig-count count="13"/>
<table-count count="2"/>
<equation-count count="19"/>
<ref-count count="90"/>
<page-count count="22"/>
<word-count count="10710"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Technical Advances in Plant Science</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Around the world, fruit plays an increasingly vital role in agriculture and economy. According to Food and Agriculture Organization of the United Nations (FAO), the total value of grape production has increased steadily since 1991, to more than $80 billion by 2020. Fruit harvesting is characterized by having limited work cycles and being labor intensive and time-consuming. With aging of the population and lack of rural labor force, labor costs have increased year by year (<xref ref-type="bibr" rid="B74">Wu et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B30">Li Y. J. et&#xa0;al., 2022</xref>). Under the influence of the COVID-19 pandemic and related policies (<xref ref-type="bibr" rid="B1">Aamir et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B45">Nawaz et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B4">Bhatti et&#xa0;al., 2022a</xref>; <xref ref-type="bibr" rid="B5">Bhatti et&#xa0;al., 2022b</xref>), the contradiction between labor demand and labor costs has become more prominent (<xref ref-type="bibr" rid="B35">Liang et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B37">Lin et&#xa0;al., 2022</xref>). This has had a negative impact on traditional hand-picking operations. With the deterioration of environmental issues (<xref ref-type="bibr" rid="B3">Bhatti et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B16">Galvan et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B59">Tang et&#xa0;al., 2023a</xref>), all the above factors pose a great challenge to China&#x2019;s fruit industry. With the rapid development of modern information technology and artificial intelligence technology, fruit harvesting robots and their related technologies have attracted extensive attention (<xref ref-type="bibr" rid="B10">Chen M. et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B13">Fu L. H. et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B14">Fu L. et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B53">Rysz and Mehta, 2021</xref>; <xref ref-type="bibr" rid="B79">Yang, 2021</xref>; <xref ref-type="bibr" rid="B26">Kang et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B69">Wang X. et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B75">Wu Z. et&#xa0;al., 2022</xref>).</p>
<p>As the basis of autonomous navigation, road detection is crucial to the precise operation of fruit harvesting robots and has become the focus of research in recent years (<xref ref-type="bibr" rid="B43">Ma et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B58">Sun et&#xa0;al., 2022</xref>). The main objective of road extraction is to extract the road regions from the background in a complex scene to lay the foundation for determining the navigation path. According to the characteristics of roads, they can be divided into two categories: structured roads and unstructured roads. Structured roads are standardized roads similar to urban roads and expressways, with clear lane markings, regular road edges, and distinct geometric features. Unstructured roads are those with irregular road edges, unclear road boundaries, no lane lines, and similar to orchards and rural areas. Compared to structured roads, unstructured roads have a more complex environmental background. For the most part, the surface of the unstructured road is mostly uneven, with a few random weeds. In contrast, the problem of unstructured road extraction is more complicated.</p>
<p>Research of road detection is usually divided into machine learning segmentation methods and traditional algorithms based on image features.</p>
<p>Road segmentation methods of machine learning are mainly divided into clustering (<xref ref-type="bibr" rid="B87">Zhang Z. Q. et&#xa0;al., 2022b</xref>), seed support vector machine (SVM; <xref ref-type="bibr" rid="B39">Liu et&#xa0;al., 2018</xref>), deep learning (<xref ref-type="bibr" rid="B32">Li et&#xa0;al., 2020</xref>), and other methods. <xref ref-type="bibr" rid="B80">Yang Z. et&#xa0;al. (2022)</xref> have proposed a visual navigation path extraction method based on neural network and pixel scanning. They introduced Segnet and Unet networks to improve the segmentation effect of orchard road condition information and background environment and adopted sliding filtering algorithm, a scanning method, and a weighted average method to fit the final navigation path. <xref ref-type="bibr" rid="B29">Lei et&#xa0;al. (2021)</xref> have combined improved SVM and two-dimensional lidar point cloud data to detect and identify unstructured roads. <xref ref-type="bibr" rid="B65">Wang E. et&#xa0;al. (2019)</xref> have realized road extraction of complex scenes by combining illumination invariant images and analyzing probability map and gradient information. <xref ref-type="bibr" rid="B28">Kim et&#xa0;al. (2020)</xref> have implemented automatic path detection in semi-structured orchards based on patch and CNN neural network methods. <xref ref-type="bibr" rid="B2">Alam et&#xa0;al. (2021)</xref> have implemented road extraction in structured and unstructured environments by combining multi-nearest neighbor classification and soft voting aggregation. Some scholars have also studied methods for road extraction in remote sensing based on machine learning methods (<xref ref-type="bibr" rid="B76">Xin et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B9">Chen et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B18">Guan et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B81">Yang M. et&#xa0;al., 2022</xref>). However, relevant research has been more on the basis of urban development analysis or traffic network monitoring and other fields, which are not applicable to picking robots. Machine learning usually does not require manual feature selection. However, this method requires specific network training and a large number of training sets and has certain limitations.</p>
<p>In the method based on image-feature analysis, some scholars use color, texture and other features to distinguish road and nonroad areas by establishing models and other methods. <xref ref-type="bibr" rid="B90">Zhou et&#xa0;al. (2021)</xref> have used the H component to extract the target path for the sky region. <xref ref-type="bibr" rid="B8">Chen J et&#xa0;al. (2020</xref>; <xref ref-type="bibr" rid="B7">2021)</xref> have used an improved gray scale factor and the maximum interclass variance method (Otsu) method to extract gray scale images of soil and plants and realized segmentation of soil and plants in the greenhouse environment. <xref ref-type="bibr" rid="B50">Qi et&#xa0;al. (2019)</xref> have segmented the road region based on a graph-based manifold ranking approach and used binomial functions to fit the road region model, thus realizing road recognition in rural environment. Some scholars have also considered the vanishing point and other spatial structure features in the process of road extraction. <xref ref-type="bibr" rid="B57">Su et&#xa0;al. (2019)</xref> have adopted the Dijkstra method combined with single-line lidar to realize road extraction on the basis of the constraints of pre-vanishing points of illumination-invariant images. <xref ref-type="bibr" rid="B48">Phung et&#xa0;al. (2016)</xref> have realized pedestrian lane detection based on an improved vanishing point estimation method combined with geometry and color features. However, the detection of vanishing points is time-consuming and mostly applied to structured road detection (<xref ref-type="bibr" rid="B77">Xu et&#xa0;al., 2018</xref>), which is not suitable for dealing with unstructured roads.</p>
<p>To realize autonomous walking and precise operation of fruit harvesting robots in orchard environments and aiming at the uncertainty of random distribution of roadside fruit and road complexity, it is necessary to deeply study the problem of synchronous road extraction and fruit identification. This study enables robot perception of barrier-free road areas and roadside fruit distribution in the current environment and can provide an inferential basis for robot global operational behavior decisions in complex orchard environments. Moreover, this study can lay the foundation for the joint control and operation of navigation and picking based on visual guidance in the panoramic environment of wild orchards. However, current approaches have only focused on road extraction, without considering the roadside fruit detection. In this case, the autonomous decision-making function of the robot cannot perform reasonable picking responses and navigation path planning based on the random distribution of fruits along the road, which is detrimental to the intelligent global continuous operation of the robot.</p>
<p>In terms of object detection, neural networks have been widely used in the field of smart agriculture (<xref ref-type="bibr" rid="B27">Khaki and Wang, 2019</xref>; <xref ref-type="bibr" rid="B60">Tang et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B12">Feng et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B15">Fu et&#xa0;al., 2022</xref>), and You Only Look Once (YOLO), as one of the fastest target detection models at present, has also been rapidly developed (<xref ref-type="bibr" rid="B82">Ye et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B46">Ning et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B69">Wang X. Y. et&#xa0;al., 2022</xref>). For example, due to the excellent performance of the YOLOv5 model in terms of accuracy and running time, it has been greatly valued by scholars in the research of crop growth-morphology recognition (<xref ref-type="bibr" rid="B41">Lv et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B51">Rong et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B73">Wu F. et&#xa0;al., 2022</xref>), detection and positioning (<xref ref-type="bibr" rid="B11">Fang et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B24">Jintasuttisak et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B31">Li G. et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B70">Wang H. et&#xa0;al., 2022</xref>), tracking counting (<xref ref-type="bibr" rid="B42">Lyu et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B55">She et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B83">Zang et&#xa0;al., 2022</xref>), and pest recognition (<xref ref-type="bibr" rid="B33">Li S. et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B49">Qi et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B85">Zhang et&#xa0;al., 2022</xref>).</p>
<p>Given the importance of detecting and locating fruit for picking robots, researchers have explored various fruit detection and location methods based on neural networks (<xref ref-type="bibr" rid="B67">Wang C. et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B17">Ge et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B23">Jia et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B89">Zhou et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B62">Tang et&#xa0;al., 2023c</xref>). To improve the operational efficiency and success rate of picking robots, researchers have gradually shifted their focus to picking-path planning algorithms and picking decision systems based on fruit detection (<xref ref-type="bibr" rid="B38">Lin et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B66">Wang Y. et&#xa0;al., 2022</xref>). For example, <xref ref-type="bibr" rid="B78">Xu et&#xa0;al. (2022)</xref> have proposed an efficient combined multipoint picking scheme for tea buds through a greedy algorithm and ant colony algorithm, which improved picking efficiency and overall picking success rate. <xref ref-type="bibr" rid="B46">Ning et&#xa0;al. (2022)</xref> proposed a method for recognition and planning robotic picking sequences for sweet peppers based on an improved YOLOV4 model and a principle of anticollision picking within picking clusters. The method can accurately detects sweet peppers, reduces collision damage, and improves picking efficiency in high-density orchard environments. <xref ref-type="bibr" rid="B51">Rong et&#xa0;al. (2022)</xref> have proposed an obstacle avoidance method that combines end-effector grasping-pose adjustment and harvesting sequence planning based on a custom manipulator. Experiments show that the method significantly reduced the impact of collision on the picking and improved the success rate of tomato picking. Although some progress has been made in the study of local target detection and picking planning, there have been few reports on the synchronization information perception needs of picking robots to autonomously pick and walk.</p>
<p>To implement the behavioral decision-making function of the picker robot to walk autonomously and pick accurately throughout the entire process in a large-area orchard environment, road extraction and roadside fruit identification should first be implemented in the current working scenario. Currently, many algorithms only focus on road extraction and ignore the fruit distribution along the road, which leads to the serious problem that picking robots are not robust enough to adapt to the changing orchard environments. Therefore, a road extraction and roadside fruit synchronous recognition algorithm based on unstructured road was proposed in this study. The main contributions of this study were as follows:</p>
<list list-type="simple">
<list-item>
<p>(1) Currently, numerous studies have focused on extracting unstructured roads without considering the synchronous recognition of roadside fruits, which is detrimental to improving the ability of picking robots to obtain environmental information. Motivated by the need for cooperative behavioral decision-making in fruit picking robots, this study proposed a framework for unstructured road extraction and synchronous recognition of roadside fruit. This framework can effectively improve the ability of fruit-picking robots to extract crucial information from the picking environment and lay a foundation for multitask parallel processing, thereby enabling cooperative behavioral decision-making among fruit-picking robots.</p>
</list-item>
<list-item>
<p>(2) Due to the randomness and complexity of orchard environments, the results of road extraction directly from raw images were not very accurate and contained a large number of misidentified regions. An image preprocessing method based on image enhancement and filtering preprocessing was designed here which reduced the influence of interference existing in the complex orchard environment. Simultaneously, this approach enhanced the precision of road extraction results and was of great importance for improving the quality of road extraction.</p>
</list-item>
<list-item>
<p>(3) The irregular road edges of unstructured roads and various interference factors in orchards considerably impacted the stability of the road extraction results. To address this issue, analyses of orchard images were conducted to optimize the gray factor and enhance its adaptability to field orchards. A two-space fusion unstructured road extraction algorithm was proposed, which used color channel enhancement and gray factor optimization and demonstrated great adaptability to interference factors, such as shadow, uneven lighting, grapevine on the side of the road, and strong contrast between light and shade in the field complex environment.</p>
</list-item>
<list-item>
<p>(4) A fusion algorithm based on the road extraction algorithm and roadside fruit detection algorithm was constructed. Based on the detection requirements for roadside grapes in wide-field environments, YOLO models were compared, selected, and optimized for their parameters. Subsequently, the three functions of image preprocessing, road extraction, and roadside grape recognition were integrated to construct a synchronous recognition algorithm, allowing for the simultaneous extraction of road and other key information during the fruit-picking process. The proposed algorithm provided information for decision-making and reasoning of collaborative behavior of key parts of the robot, so as to improve robot adaptability to randomly distributed fruit.</p>
</list-item>
</list>
<p>This study will lay a foundation for the construction of robot behavior decision control system, and it is of great significance for improving the intelligence, accuracy, and stability of robot field autonomous work.</p>
<p>The rest of this report is organized as follows. Section 2 introduced the materials and data. Section 3 explained the structure and implementation of the algorithm. Section 4 presented the experimental results and comparative discussion. Finally, Section 5 summarized the study and plans for future work.</p>
</sec>
<sec id="s2">
<label>2</label>
<title>Materials and data acquisition</title>
<sec id="s2_1">
<label>2.1</label>
<title>Experimental platform for wine grape picking and moving</title>
<p>This study was based on the wine grape visual mobile picking robot that was independently designed and developed. The overall layout of the test platform is shown in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1A</bold>
</xref>. The test platform was battery powered to operate in the orchard. The length and width of the platform were 1.065 and 0.7 m, respectively, and the maximum climbing capacity was 30&#xb0;. Two cameras were installed on the end-effector of the platform as picking camera and navigation camera, separately.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Overall layout and control flow of test platform. <bold>(A)</bold> Overall layout of test platform. Mechanical arm (AUBO-i5, AUBO), 1; Battery, 2; Controller, 3; Camera for picking (HBV-1714, Huiber Vision Technology Co., Ltd), 4; Camera for navigation (ZED 2, Stereolabs), 5; End-effector, 6; Human Machine Interaction, 7; Industrial Personal Computer (IPC), 8; and Track car, 9. <bold>(B)</bold> Control flow of the test platform.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1103276-g001.tif"/>
</fig>
<p>The control process of the experimental platform was divided into three main parts (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1B</bold>
</xref>). The first part of the control system was to construct algorithms for unstructured road extraction and roadside fruit synchronization recognition based on the collected datasets A and B. Then, the industrial personal computer (IPC) implemented the algorithm-based key information acquisition, recognition, and behavioral decisions. The second part of the control system was to use the IPC to control the navigation camera for orchard road extraction and roadside fruit recognition. By recognizing the distinction between unstructured roads and chaotic backgrounds, as well as the classification and recognition of roadside grapes and grapevines, it provided a judgment basis for the IPC to distinguish the presence of roadside fruit and lay the foundation for behavioral decisions. Based on the above information, the third part of the control system extracted the navigation path of the orchard and judged the presence of fruit in the current roadside area. If there were fruit on the roadside, the controller controlled the tracked vehicle to approach the fruit area of the roadside fruit tree and fed the information to the robotic arm and another set of stereo camera for precise positioning (the picking camera for short) for picking operations. Using the picking camera, fruit could be re-identified and accurately positioned to achieve fruit picking in complex environments. The work of this study mainly implemented the first part of the control system.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Experimental subjects</title>
<p>Wine grapes and non-structural orchards were taken as experiment subjects in this research. Wine grape fruit are clustered in shape and usually purple at maturity, with a clear color difference from leaves. The planting mode is usually in rows with a certain row spacing. As the fruit distribution and planting patterns of wine grapes are similar to other row-grown crops, such as tomato and dragon fruit, the results of this study are expected to be extendable to other types of fruit.</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Image acquisition</title>
<p>In August 2022, experimental images were obtained from Xinyu Winehouse (Bohu County, Bazhou, Xinjiang). The device used for dataset sampling was an OPPO R11 mobile phone with a 20-megapixel rear camera. All images were taken under natural daylight conditions without artificial light sources and saved in Joint Photographic Expert Group (jpg) format with image size 4608&#xd7;2128 pixels.</p>
<p>The collected images were divided into datasets A and B. The original images of vineyards in dataset A included roads and vines. As the algorithm proposed in this study was intended to provide a basis for behavioral decisions of grape-picking robots, the focus was on the region of unstructured road and distribution of fruit in a unilateral grape row. Therefore, during the collection process of dataset A, the camera observation direction was biased to the right of the road center line (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2A</bold>
</xref>). A total of 337 typical orchard images were selected, in which the roads in the grape orchard environment had features of shadow and irregular road edges (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>). Dataset B was composed of 1081 valid images showing wine grape clusters, including grape samples in numerous cases, with images of grapes in front and backlight (<xref ref-type="fig" rid="f2">
<bold>Figures&#xa0;2C, D</bold>
</xref>).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Schematic diagram of the acquisition process of test images. <bold>(A)</bold> The camera observation direction. <bold>(B)</bold> Example image of the wine vineyard. <bold>(C)</bold> Examples of frontlight images. <bold>(D)</bold> Examples of backlight images.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1103276-g002.tif"/>
</fig>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Image datasets</title>
<p>To simulate the vision system of the picking robot, valid grape and orchard image samples were collected under different conditions of illumination, weather, sampling distance, and differing severity of fruit adhesion and occlusion, forming datasets A and B.</p>
<p>Dataset A consisted mainly of orchard images with uneven lighting, with multiple weeds, with large shadows, in different weather conditions, and with different light and shade contrasts (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3A</bold>
</xref>).</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Natural images of vineyards and wine grape clusters. <bold>(A)</bold> Natural images of vineyards. <bold>(B)</bold> Natural images of wine grape clusters.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1103276-g003.tif"/>
</fig>
<p>The natural images of grapes (dataset B) mainly included images of single cluster grape, multiple clusters grape, slightly-adhered grape, severely-adhered grapes, front and back illumination, small string grapes, large cluster grapes, and grapes on a sunny day, on a cloudy day, and in shadow as well as grapes at different sampling distances. Their representative images are shown in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>.</p>
<p>Datasets A and B were challenging considering the effects of complex background, light levels, shadows, randomly distributed fruits, weeds, and different levels of fruit occlusion. Images of grapes and vineyards in a typical complex environment were contained in dataset A and B (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>).</p>
<p>Dataset A was only employed for testing the performance of unstructured road extraction and the overall algorithm, with 100 images in this dataset randomly selected as the test set for algorithms in this study. To improve algorithm efficiency, the processing image size of the algorithm was set to 1024&#xd7;473 pixels.</p>
<p>Dataset B was used for training and validation of the fruit model on the YOLOv7 roadside. Under LabelImg (<ext-link ext-link-type="uri" xlink:href="https://github.com/tzutalin/labelImg">https://github.com/tzutalin/labelImg</ext-link>), grapes in images were manually annotated as rectangles with the label &#x201c;fruit,&#x201d; which then saved annotation files in &#x201c;txt&#x201d; format. Among them, the whole image set was randomly divided into training and validation sets with a ratio of 9 to 1.</p>
</sec>
</sec>
<sec id="s3">
<label>3</label>
<title>Methodology and algorithm description</title>
<p>In this study, the algorithm content was mainly divided into two parts: First, the road in the unstructured orchard environment was extracted. Second, taking the road extraction results as input, roadside fruit were identified through YOLOv7 to realize the synchronous information extraction of the road extraction and roadside fruit detection. The algorithm process of this study is shown in <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Flow chart of the entire algorithm.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1103276-g004.tif"/>
</fig>
<sec id="s3_1">
<label>3.1</label>
<title>Image preprocessing</title>
<p>During image acquisition in the orchard, it was inevitable to be disturbed by external environmental noise, such as uneven light and dust, which made the image details unclear and led to road extraction errors. Therefore, this study preprocessed the images in dataset A, which was of great significance for improving the quality of road segmentation (<xref ref-type="bibr" rid="B64">Wang et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B84">Zhang P. et&#xa0;al., 2022</xref>). The image preprocessing method proposed in this study consisted of five steps, with the processing procedure and image quality enhancement results illustrated in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>. Further details can be found in Sections 3.3.1 - 3.1.5.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Process and results of image preprocessing algorithm. <bold>(A)</bold> Original image. <bold>(B)</bold> Region of interest. <bold>(C)</bold> Bilateral filtering result. <bold>(D)</bold> Log space transformation. <bold>(E)</bold> Image enhancement based on the MSRCR algorithm. <bold>(F)</bold> S-component enhancement. <bold>(G)</bold> Results of image preprocessing algorithm.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1103276-g005.tif"/>
</fig>
<sec id="s3_1_1">
<label>3.1.1</label>
<title>Interception of regions of interest</title>
<p>The images in dataset A were composed of sky, road, grapes, and messy background, among which the sky and messy background were mainly distributed at the top of an image. In the image processing process, if the entire image captured by the camera was merely taken as the research object, a substantial amount of computation would be required and a significant amount of interference inevitably occurs, which will reduce road extraction accuracy. To this end, only the regions of interest (ROI) of the image was extracted for subsequent processing. After a number of experiments, it was found that the appropriate ROI was at the lower 5/6 position of the image (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>). This ROI selection not only significantly reduced the calculation volume, but also ensured the accuracy and reliability of unstructured road extraction.</p>
</sec>
<sec id="s3_1_2">
<label>3.1.2</label>
<title>Bilateral filter</title>
<p>A bilateral filter can smooth the image while maintaining edge details (<xref ref-type="bibr" rid="B52">Routray et&#xa0;al., 2020</xref>). To enhance and improve contrast between the foreground and background of the road to facilitate subsequent segmentation, a bilateral filter was used to process the present images. To reduce the influence of minor areas, such as vines, fruits, vine gaps, and cavities in subsequent segmentation, the key parameters of the bilateral filter (<xref ref-type="bibr" rid="B40">Liu et&#xa0;al., 2017</xref>) in this study were set to: diameter <italic>d</italic> of the pixel domain was 60, standard deviation of spatial domain 120, and standard deviation of intensity domain 60 (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5C</bold>
</xref>).</p>
</sec>
<sec id="s3_1_3">
<label>3.1.3</label>
<title>Logarithmic space transformation</title>
<p>To enhance the details in the shadowed regions and provide images with enhanced details and uniform brightness for subsequent MSRCR processing, a logarithmic transformation of the V-component in hue, saturation, and value (HSV) space was used here to expand the low gray values and compress high gray values in this channel (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5D</bold>
</xref>). The standard form was</p>
<disp-formula>
<label>(1)</label>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mo>=</mml:mo>
<mml:mi>c</mml:mi>
<mml:mo>&#x2217;</mml:mo>
<mml:mi>log</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>+</mml:mo>
<mml:mi>L</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <italic>S</italic> is the correction image, <italic>L</italic> the source image, and <italic>c</italic> the gain adjustment parameter, which was set to 1.</p>
</sec>
<sec id="s3_1_4">
<label>3.1.4</label>
<title>Image enhancement based on the MSRCR algorithm</title>
<p>After the above processing and observing the image under RGB color space, the altering influence of illumination was found not to be entirely eliminated. Therefore, the MSRCR algorithm was selected for image correction and enhancement here to obtain realistic images with reduced illumination effects. The resulting Equations 2&#x2013;4 were expressed as:</p>
<disp-formula>
<label>(2)</label>
<mml:math display="block" id="M2">
<mml:mrow>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>R</mml:mi>
<mml:mi>C</mml:mi>
<mml:mi>R</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>R</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<label>(3)</label>
<mml:math display="block" id="M3">
<mml:mrow>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>R</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mi>N</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c6;</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mi>log</mml:mi>
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mi>N</mml:mi>
</mml:munderover>
<mml:mi>log</mml:mi>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>&#x2217;</mml:mo>
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<label>(4)</label>
<mml:math display="block" id="M4">
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mi>&#x3b2;</mml:mi>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mi>log</mml:mi>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>log</mml:mi>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mi>N</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>The optimal functional form of MSRCR is shown in Equation 5, expressed as:</p>
<disp-formula>
<label>(5)</label>
<mml:math display="block" id="M5">
<mml:mrow>
<mml:mtable>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>R</mml:mi>
<mml:mi>C</mml:mi>
<mml:mi>R</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mi>G</mml:mi>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:mi>log</mml:mi>
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mi>N</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:mi>log</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mstyle>
<mml:mo>&#x2217;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mi>b</mml:mi>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im1">
<mml:mrow>
<mml:msub>
<mml:mi>I</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> is the color component image corresponding to each color channel, <inline-formula>
<mml:math display="inline" id="im2">
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> the Gaussian filter function, and <inline-formula>
<mml:math display="inline" id="im3">
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> the color restoration factor of the <italic>i</italic>
<sup>th</sup> color channel, <inline-formula>
<mml:math display="inline" id="im4">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c6;</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> the weight, and <italic>N</italic> the number of spectral channel, where <inline-formula>
<mml:math display="inline" id="im5">
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mi>N</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:msub>
<mml:mi>&#x3c6;</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</inline-formula>, <italic>&#x3b2;</italic> a gain constant, and <italic>&#x3b1;</italic> the strength of nonlinearity, <italic>G</italic> and <italic>b</italic> the final gain and offset values, respectively. The parameters of MSRCR in this study were configured according to the reference (<xref ref-type="bibr" rid="B25">Jobson et&#xa0;al., 1997</xref>).</p>
</sec>
<sec id="s3_1_5">
<label>3.1.5</label>
<title>S-component enhancement</title>
<p>To enrich color information, this study adjusted the saturation channel S to enhance image quality, with the formulas described by Equations 6&#x2013;7 (<xref ref-type="bibr" rid="B22">Huang et&#xa0;al., 2022</xref>), expressed as:</p>
<disp-formula>
<label>(6)</label>
<mml:math display="block" id="M6">
<mml:mrow>
<mml:msub>
<mml:mi>S</mml:mi>
<mml:mrow>
<mml:mi>o</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mi>&#x3b1;</mml:mi>
<mml:mi>s</mml:mi>
</mml:msub>
<mml:mo>&#x2217;</mml:mo>
<mml:mi>T</mml:mi>
<mml:mo>&#x2217;</mml:mo>
<mml:msub>
<mml:mi>S</mml:mi>
<mml:mrow>
<mml:mi>o</mml:mi>
<mml:mtext>ri</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<label>(7)</label>
<mml:math display="block" id="M7">
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>G</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>B</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:mi>M</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>x</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>G</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>B</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:mi>M</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>n</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>G</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>B</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>G</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>B</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im6">
<mml:mrow>
<mml:msub>
<mml:mi>S</mml:mi>
<mml:mrow>
<mml:mi>o</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represents the enhanced saturation channel, <inline-formula>
<mml:math display="inline" id="im7">
<mml:mrow>
<mml:msub>
<mml:mi>S</mml:mi>
<mml:mrow>
<mml:mi>o</mml:mi>
<mml:mtext>ri</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> the original saturation channel of S, <inline-formula>
<mml:math display="inline" id="im8">
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>G</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>B</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula>
<mml:math display="inline" id="im9">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>x</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>G</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>B</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula>
<mml:math display="inline" id="im10">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>n</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>G</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>B</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> the average, maximum, and minimum values of pixels corresponding to R, G, and B color channels, respectively, and <italic>&#x3b1;<sub>s</sub>
</italic> and <italic>T</italic> the gain coefficients of the saturation channel, which control the enhancement degree of S channel image.</p>
<p>Qualitative and quantitative evaluation is significant for the evaluation of image quality. In the qualitative evaluation, the quality of the enhanced image was evaluated in color, contrast, and detail. By comparing the gain effect at different values, it was observed that, if the value of <italic>&#x3b1;<sub>s</sub>
</italic> was too high or low, the image contrast was reduced or saturation too strong, which affected the visual effect of the image. When <italic>&#x3b1;<sub>s</sub>
</italic> = 0.2, the contrast of the image was low, resulting in poor overall visual effect. When <italic>&#x3b1;<sub>s</sub>
</italic> was greater than 0.5, there was significant color distortion despite the high contrast of images, resulting in partial loss of detail in the image. When <italic>&#x3b1;<sub>s</sub>
</italic> = 0.3, although the tone of the image was better maintained, the enhancement effect was not obvious compared with the image without S-component enhancement. When <italic>&#x3b1;<sub>s</sub>
</italic> = 0.4, the contrast of the image was improved significantly without obvious color distortion and the visual effect was the best.</p>
<p>In the quantitative evaluation, this paper evaluated the performance the processing results by three metrics Peak signal-to-noise ratio (PSNR, <xref ref-type="bibr" rid="B21">He et&#xa0;al., 2015</xref>), information entropy value (IE, <xref ref-type="bibr" rid="B68">Wang et&#xa0;al., 2021</xref>) and average gradient (AG, <xref ref-type="bibr" rid="B86">Zhang X. et&#xa0;al., 2022</xref>). PSNR has been widely used for measuring attributes like texture details enhancement, details preservation and contrast enhancement. A higher PSNR generally indicates that the processed image is of higher quality (<xref ref-type="bibr" rid="B20">Gupta and Tiwari, 2019</xref>). IE is mainly an objective evaluation index that measures how much information an image contains. The enormous IE value indicates that the enhancement image contains more image information. AG represents the degree of change in the gray value of the image, and is one of the criteria for judging the processing of image details and clarity. The large AG value indicates that the enhancement image contains more gradient information and detailed texture. The image enhancement quality evaluation parameters under different values of <italic>&#x3b1;<sub>s</sub>
</italic> were shown in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5F</bold>
</xref>, where the optimal parameter values were marked in red and the second highest parameter values were highlighted in blue. Figure illustrated that the value of AG increased as the value of <italic>&#x3b1;<sub>s</sub>
</italic> increased, indicating that the sharpness of the image was also enhanced progressively. However, color distortion occurred when <italic>&#x3b1;<sub>s</sub>
</italic> was set to 0.5 or 0.6. Therefore, this paper eliminated the enhanced images with these two parameters and only discussed the image enhancement results with low <italic>&#x3b1;<sub>s</sub>
</italic> value(<italic>&#x3b1;<sub>s</sub>
</italic>&lt; 0.5). Moreover, the highest value and the second highest value of PSNR and IE were mainly concentrated in the results of <italic>&#x3b1;<sub>s</sub>
</italic> =0.3 and <italic>&#x3b1;<sub>s</sub>
</italic> =0.4, which indicates that under the above two parameter settings, the images had a good performance in terms of image information, contrast enhancement and detail preservation. Furthermore, for <italic>&#x3b1;<sub>s</sub>
</italic>=0.4, both the IE and AG values were higher than those for <italic>&#x3b1;<sub>s</sub>
</italic>=0.3, while the PSNR was slightly lower than the latter. Therefore, based on the qualitative evaluation results and the requirements of enhanced images in terms of clarity, information content, picture details and contrast, <italic>&#x3b1;<sub>s</sub>
</italic> was finally set at 0.4 in this study.</p>
</sec>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Unstructured road extraction</title>
<p>In this section, unstructured road extraction was achieved by fusing two parts, including the segmented road region after removing green regions from the HSV space and road region based on improved gray factor.</p>
<sec id="s3_2_1">
<label>3.2.1</label>
<title>Road extraction based on color enhancement and HSV color space</title>
<p>HSV color space is composed of hue (H), saturation (S) and luminance (V) channels. As HSV color space is more consistent with human color perception, it has been widely used in multifield research based on machine vision, such as medicine (<xref ref-type="bibr" rid="B56">Singh, 2020</xref>), agriculture (<xref ref-type="bibr" rid="B36">Liao et&#xa0;al., 2022</xref>), and chemical industries (<xref ref-type="bibr" rid="B54">Safarik et&#xa0;al., 2019</xref>). Therefore, the HSV color space was used here to extract road regions.</p>
<p>First, the enhanced and optimized RGB image was converted into an HSV image and the threshold range (H<sub>min</sub>, H<sub>max</sub>), (S<sub>min</sub>, S<sub>max</sub>), and (V<sub>min</sub>, V<sub>max</sub>) of each channel set to binarize the image. This completed the constraint and extraction of the green area, so as to distinguish the road area from the plant area (vines, weeds, and background trees). Based on Exploratory data analysis (EDA) and empirical values (<xref ref-type="bibr" rid="B19">Guo et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B47">Peng et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B6">Camizuli and Carranza, 2018</xref>), the HSV ranges were set at (35,77),(43,255),and (46,255), respectively (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6A</bold>
</xref>). As can be seen from the image, although the road extraction was relatively complete, the main constraint in the HSV space was the green region, such that there were still interference regions due to grapes and their vines, leaf gaps, and other factors in extraction results.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Process and results of road extraction. <bold>(A)</bold> Road extraction results in HSV space. <bold>(B)</bold> Road extraction results based on ExG Gray factor. <bold>(C)</bold> Road segmentation effect under different <italic>T<sub>B</sub>
</italic>. <bold>(D)</bold> Road extraction results based on optimized grayscale factor. <bold>(E)</bold> Fused binary image. <bold>(F)</bold> Morphological processing result. <bold>(G)</bold> Final extraction result. <bold>(H)</bold> Manual image segmentation. <bold>(I)</bold> Results of comparison between proposed algorithm and real situation.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1103276-g006.tif"/>
</fig>
</sec>
<sec id="s3_2_2">
<label>3.2.2</label>
<title>Road extraction based on gray factor optimization</title>
<p>Taking advantage of the significant color difference between different objects in the image, numerous researchers have realized object segmentation by examining different gray weights, such as excessive red plant index (ExR, <xref ref-type="bibr" rid="B44">Meyer et&#xa0;al., 1999</xref>), excessive green index (ExG, <xref ref-type="bibr" rid="B72">Woebbecke et&#xa0;al., 1995</xref>), and normalized difference index (NDI, <xref ref-type="bibr" rid="B71">Woebbecke et&#xa0;al., 1993</xref>). The preprocessed image mainly contained four areas: grape vines regions, soil areas, background, and shadow areas. Therefore, through manual segmentation of the above regions and obtaining the average values of R, G, and B in different regions, the gray factor was improved by a heuristic method based on the excessive green index (ExG). The optimized gray factor and its binarized image acquisition formula were expressed in Equations 8 and 9 as</p>
<disp-formula>
<label>(8)</label>
<mml:math display="block" id="M8">
<mml:mrow>
<mml:mi>g</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mn>1.84</mml:mn>
<mml:mi>G</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>B</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<label>(9)</label>
<mml:math display="block" id="M9">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mtable>
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:mn>0</mml:mn>
<mml:mo>&#x22ef;</mml:mo>
<mml:mo>&#x22ef;</mml:mo>
<mml:mo>&#x22ef;</mml:mo>
<mml:mn>1.84</mml:mn>
<mml:mi>G</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>B</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>&#x2264;</mml:mo>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>B</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mrow>
<mml:mn>255</mml:mn>
<mml:mo>&#x22ef;</mml:mo>
<mml:mo>&#x22ef;</mml:mo>
<mml:mo>&#x22ef;</mml:mo>
<mml:mn>1.84</mml:mn>
<mml:mi>G</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>B</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
<mml:mo>&gt;</mml:mo>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>B</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where gray(x,y) is the optimized gray level factor, f(x,y) the binarized image, and G(x,y), B(x,y), and R(x,y) as the green, blue, and red components of the color range, respectively. And <italic>T<sub>B</sub>
</italic> is the binarization threshold.</p>
<p>Based on the optimized grayscale factor, the grayscale image and the grayscale histogram of the enhanced image after the S-component were plotted in <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6C</bold>
</xref>. As can be seen from the gray histogram, most pixels in the image had a gray value of 0, corresponding to the majority of black road areas in the gray map. However, as shown by the red area in the grayscale image, a few pixels in the road area had gray values that were not zero. Therefore, the rationality of the binarization threshold <italic>T<sub>B</sub>
</italic> directly affected the integrity of the road segmentation. To determine the optimal binarization threshold, a comparative experiment was conducted in this paper, using the threshold value <italic>T<sub>B</sub>
</italic> as the independent variable and the road segmentation result as the dependent variable. The initial value of the binarization threshold was set to 0, and different binarization thresholds were used to segment the road. The threshold of binarization was increased by 10 for each group until the segmentation result incorrectly included the vine area on the side of the road.</p>
<p>When <italic>T<sub>B</sub>
</italic>= 0, the segmentation result indicated a significantly smaller road area than the actual road. With <italic>T<sub>B</sub>
</italic> set at 10, the vast majority of road area was accurately extracted from the segmentation results. However, when <italic>T<sub>B</sub>
</italic> was increased to 20, while the extracted road area was more comprehensive, there were numerous incorrectly extracted sections. Consequently, for this article, <italic>T<sub>B</sub>
</italic> was established at 10, the road extraction results were shown in <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6D</bold>
</xref>.</p>
<p>The extraction method of unoptimized gray factor based on ExG was found to be affected by shadows and weeds, resulting in a large number of noise points and holes in the treatment results, and only extracted a small number of road regions (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6B</bold>
</xref>). Thus, the extracted area was significantly smaller than the real value. On the other hand, the improved gray factor method exhibited superior segmentation results for the grapevine area on the road and its surroundings, showing great advantages in the accuracy and integrity of road segmentation (as depicted in <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6D</bold>
</xref>). The above results indicated that compared with the unimproved gray factor, the improved gray factor method was more adaptable to unfavorable environmental conditions such as shadows and lighting in the field.</p>
</sec>
<sec id="s3_2_3">
<label>3.2.3</label>
<title>Binary images fusion and morphological processing</title>
<p>By fusing the above two binarized images in <xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6A, D</bold>
</xref>, most of the disturbances (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6E</bold>
</xref>) were eliminated and road edges constrained. The fused results were more consistent with the real situation.</p>
<p>However, there were various tiny noises and irregularly-shaped edges in the fused binary image. Therefore, morphological processing was performed on fused binary images to remove non-correlated structures (<xref ref-type="fig" rid="f6">
<bold>Figures&#xa0;6F, G</bold>
</xref>).</p>
<p>The road edge extracted by this algorithm was found to be in line with the trend of the real road and fundamentally eliminated the vine area on the side of the road (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6I</bold>
</xref>). This reduced the interference of light, shadow, weeds, and dead branches to road extraction, with high extraction integrity and good comprehensive performance.</p>
</sec>
<sec id="s3_2_4">
<label>3.2.4</label>
<title>Performance evaluation indexes</title>
<p>In this study, the number of ROI image pixels (NRP) and the ratio between the wrongly extracted pixels and the number of ROI image pixels (RBP) were used as evaluation indices for verifying the performance of the road extraction algorithm. And the calculation equations of this evaluation index expressed in Equation 10 as</p>
<disp-formula>
<label>(10)</label>
<mml:math display="block" id="M10">
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>B</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>N</mml:mi>
<mml:mi>W</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>N</mml:mi>
<mml:mi>R</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>100</mml:mn>
<mml:mo>%</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where NWP is the number of wrongly extracted pixels by the algorithm.</p>
</sec>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Roadside fruit detection based on YOLOv7</title>
<sec id="s3_3_1">
<label>3.3.1</label>
<title>Characteristics of the YOLOv7 network structure</title>
<p>As the latest version of the YOLO series (<xref ref-type="bibr" rid="B63">Wang C. et&#xa0;al., 2022</xref>), YOLOv7 has improved the existing model in many ways. First, it offers extended efficient layer aggregation networks (E-ELAN) based on ELAN structure, which can guide different computing blocks to learn more different features and enhance the learning ability of the model on the basis of maintaining the original gradient path. Then, a compound model scaling method based on the cascade model has been proposed to ensure the initial characteristics and optimal structure of the model, which efficiently utilizes parameters and computation. Meanwhile, several trainable bag-of-freebies methods have been designed for real-time object detection, which significantly improves detection accuracy without increasing inference cost. Based on the above improvements, YOLOv7 shows great advantages in terms of speed and accuracy over other detection algorithms. Its network architecture is shown in <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref>.</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Network structure of YOLOv7.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1103276-g007.tif"/>
</fig>
<p>Based on the performance advantages of the YOLOv7 and YOLOv5 models, both models were adopted in this research to detect roadside fruits. The results were compared to identify the roadside grape detection model that is better suited for large-field environments. The selected model&#x2019;s feasibility and detection performance were then further verified for roadside fruit recognition.</p>
</sec>
<sec id="s3_3_2">
<label>3.3.2</label>
<title>Network training and parameter optimization</title>
<p>The experiment was conducted on a Windows 10 operating system, with the Python framework, YOLOv7, and YOLOv5 environments built in the Anaconda environment. The program was written in Python 3.9 and CUDA Ver. 11.7. In terms of hardware, the processor is an Intel (R) Core (R) i5-1240F CPU@2.5 GHz, the dominant frequency is 2.5 GHz, internal storage 32.0 GB, and graphics card an NVIDIA GeForce RTX 3060.</p>
<p>Due to the complex orchard environment, directly applying the default parameters of YOLO model to the roadside fruit recognition model results in poor detection results. To adapt to fruit recognition in complex field scenarios, the learning rate parameter of the YOLO model was chosen as described in this study. The initial value of the learning rate was set to 0.01 and the model was trained with different learning rates. The learning rate of each group was reduced by 0.002, respectively, until the optimal parameters were detected and chosen. By comparison, it was found that when the learning rate was larger than 0.002, the loss curves for object detection in the results suffered from severe oscillations, poor convergence or nonconvergence. Thus, the learning rate of the wine grape orchard recognition model was set to 0.002.</p>
<p>The training and verification sets were input into the network for training, with a batch size of 16 and 150 epochs, respectively (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>).</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>YOLO basic parameters.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Parameters of model</th>
<th valign="middle" align="center">Value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">Input image resolution</td>
<td valign="middle" align="center">640&#xd7;640</td>
</tr>
<tr>
<td valign="middle" align="center">Learning rate</td>
<td valign="middle" align="center">0.002</td>
</tr>
<tr>
<td valign="middle" align="center">Momentum</td>
<td valign="middle" align="center">0.937</td>
</tr>
<tr>
<td valign="middle" align="center">Optimizer weight decay</td>
<td valign="middle" align="center">0.0005</td>
</tr>
<tr>
<td valign="middle" align="center">Warmup momentum</td>
<td valign="middle" align="center">0.8</td>
</tr>
<tr>
<td valign="middle" align="center">Batch size</td>
<td valign="middle" align="center">16</td>
</tr>
<tr>
<td valign="middle" align="center">Training epochs</td>
<td valign="middle" align="center">150</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3_3_3">
<label>3.3.3</label>
<title>Model evaluation</title>
<p>In this study, precision (P), recall (R), F1-score, and <italic>mAP</italic> were used as the evaluation indices of roadside fruit detection performance and the calculation equations of each evaluation index expressed in Equations 11&#x2013;14 as:</p>
<disp-formula>
<label>(11)</label>
<mml:math display="block" id="M11">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<label>(12)</label>
<mml:math display="block" id="M12">
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<label>(13)</label>
<mml:math display="block" id="M13">
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mn>1</mml:mn>
<mml:mo>-</mml:mo>
<mml:mi>s</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>P</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>R</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<label>(14)</label>
<mml:math display="block" id="M14">
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mi>c</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:mi>A</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>c</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mi>c</mml:mi>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <italic>TP</italic>, <italic>FP</italic>, and <italic>FN</italic> correspond to true positives (there is a grape bunch in the image and the algorithm predicts it correctly), false positives (there are no grapes in the image, but the algorithm detects it), and false negatives (the algorithm failed to detect a bunch of grapes which are actually in the image), respectively, and <italic>C</italic> the number of detection classes. As only one kind of fruit was identified in this study, <italic>C</italic> = 1.</p>
</sec>
</sec>
</sec>
<sec id="s4">
<label>4</label>
<title>Experiments and discussion</title>
<p>By achieving synchronous recognition of road extraction and roadside fruit, this algorithm can considerably improve the ability of robots to perceive critical information in the orchard environments and lay the foundation for autonomous walking and picking decisions based on machine vision. Therefore, the performance of this algorithm was extremely critical for the robot&#x2019;s picking rate, navigation path extraction accuracy, and reliability of the decision system in subsequent researches. At the same time, this study served as a reference for other research in the same field.</p>
<p>In this section, the performance of image enhancement, road extraction, roadside fruit recognition, and overall fusion algorithm were verified and discussed.</p>
<sec id="s4_1">
<label>4.1</label>
<title>Road extraction effects and ablation tests</title>
<sec id="s4_1_1">
<label>4.1.1</label>
<title>Road extraction results and analysis</title>
<p>To validate the image segmentation effect of the proposed road extraction algorithm, the results obtained by fused segmentation were compared with those obtained by the conventional color image method. This study adopted two traditional algorithms: a method based on S component and Otsu and another based on the Excess Green index (ExG) and Otsu. At the same time, 25 images with pavement shadows, strong illumination variations, and grapevines with different degrees of color were selected as test samples to verify the adaptability of the above algorithms to complex environments.</p>
<p>The results of multiple sample images were compared, in which samples were original color images and other images obtained by segmentation methods. The comparative findings for partial sample images were illustrated in <xref ref-type="fig" rid="f8">
<bold>Figures&#xa0;8A&#x2013;F</bold>
</xref>, while the comparative results for additional images could be found in the <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. <xref ref-type="fig" rid="f1">
<bold>Figures&#xa0;1</bold>
</xref>&#x2013;<xref ref-type="fig" rid="f3">
<bold>3</bold>
</xref> depict the image samples with the lowest NWP value in the outcomes of Methods C, D, and E, while <xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4</bold>
</xref>&#x2013;<xref ref-type="fig" rid="f6">
<bold>6</bold>
</xref> depict the image samples with the highest NWP value in the outcomes of Methods C, D, and E, respectively.</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>Results and analysis of different segmentation methods. <bold>(A)</bold> Original images. <bold>(B)</bold> Manual image segmentation. <bold>(C)</bold> Proposed algorithm. <bold>(D)</bold> Method based on S component and Otsu. <bold>(E)</bold> Method based on EXG and Otsu. <bold>(F)</bold> Error area results extracted by different methods. <bold>(G)</bold> RBP values of partial images obtained by different methods. <bold>(H)</bold> Descriptive Statistics for NWP and RBP. <bold>(I)</bold> NWP values of 25 images obtained by different methods.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1103276-g008.tif"/>
</fig>
<p>For simplicity, the proposed algorithm was abbreviated as &#x201c;Method C&#x201d;, the method based on S component and Otsu was abbreviated as &#x201c;Method D&#x201d;, and the method based on EXG and Otsu was abbreviated as &#x201c;Method E&#x201d;.</p>
<p>In the qualitative evaluation, the quality of different segmentation methods was assessed based on the completeness of road segmentation and the distribution of error areas. Due to the complexity of the field orchard, the primary environmental factors that influence the precision of road segmentation outcomes include the grapevine area, shadowed road area (<xref ref-type="bibr" rid="B34">Li et&#xa0;al., 2018</xref>), roadside unevenly colored area, and high contrast between light and dark areas (<xref ref-type="bibr" rid="B61">Tang et&#xa0;al., 2023b</xref>). As depicted in <xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8A</bold>
</xref>, strong lighting caused the grapevine areas on the roadside to exhibit characteristics such as uneven light and shade and varying color tones. This led to a significant contrast between light and shade in the grapevine areas on both sides of the road. Additionally, different lighting angles resulted in distinct areas of shadow on the road surface, thereby increasing the complexity involved in segmenting orchard roads.</p>
<p>Observationally, it was found that the extraction results of methods D and E (<xref ref-type="fig" rid="f8">
<bold>Figures&#xa0;8D, E</bold>
</xref>) suffered from problems, such as the large area errors in identification. Although the extraction results were of great completeness, the results also contained a large number of incorrect regions (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8F</bold>
</xref>). By comprehensive comparison, the road obtained by the Method C was found to be the closest to the real situation and had the best segmentation effect among all considered methods.</p>
<p>To further analyze the adaptability of the above method to complex vineyard scenarios, the extraction results of the proposed algorithm were compared with real roads (<xref ref-type="fig" rid="f8">
<bold>Figures&#xa0;8F, G</bold>
</xref>). Based on <xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8F</bold>
</xref>, it can be observed that the error areas of methods D and E were primarily concentrated in the grapevine area on the side of the road.</p>
<p>Method D was found to be sensitive to changes in brightness, shade, and color uniformity of the grapevine region in the image, which resulted in changes in the error area of the segmentation result (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8D</bold>
</xref>). Due to the unpredictable and random nature of illumination in field environments, it was difficult to guarantee the accuracy and stability of the segmentation results achieved through method D.</p>
<p>The primary error source of method E was the grapevine area with strong contrast between light and shade, with the dark part of it being incorrectly identified as the road area. This greatly reduced the accuracy of the segmentation result. When the area of the dark region of the grapevine on the side of the road was small, the error rate of this algorithm decreased significantly. However, when faced with areas that had uneven colors on the side of the road, the error area of the segmentation result achieved through this method was significantly smaller than that of method D.</p>
<p>Conversely, Method C adapted to the aforementioned unfavorable factors, resulting in a smaller error in the segmented area, more stable road extraction performance, and the most reliable segmentation results among the three methods. Combined with the above analysis, the influence degree of unfavorable factors on the accuracy and reliability of the results obtained through different methods was comprehensively evaluated, as presented in <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Analysis of the influence degree of adverse factors on algorithms and extraction results.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" colspan="6" align="center">Degree of influence of adverse factors on algorithm accuracy</th>
</tr>
<tr>
<th valign="middle" rowspan="2" align="center">Adverse environmental factors</th>
<th valign="middle" colspan="5" align="center">Impact degree</th>
</tr>
<tr>
<th valign="middle" colspan="3" align="center">Method C</th>
<th valign="middle" align="center">Method D</th>
<th valign="middle" align="center">Method E</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">Grapevine area</td>
<td valign="middle" colspan="3" align="center">Minor</td>
<td valign="middle" align="center">Severity</td>
<td valign="middle" align="center">Severity</td>
</tr>
<tr>
<td valign="middle" align="center">Shadowed road area</td>
<td valign="middle" colspan="3" align="center">Minor</td>
<td valign="middle" align="center">Minor</td>
<td valign="middle" align="center">Minor</td>
</tr>
<tr>
<td valign="middle" align="center">Roadside unevenly colored area</td>
<td valign="middle" colspan="3" align="center">Minor</td>
<td valign="middle" align="center">Severity</td>
<td valign="middle" align="center">Medium</td>
</tr>
<tr>
<td valign="middle" align="center">Strong contrast between light &amp; dark</td>
<td valign="middle" colspan="3" align="center">Minor</td>
<td valign="middle" align="center">Severity</td>
<td valign="middle" align="center">Severity</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">Methods</td>
<td valign="middle" colspan="5" align="center">Descriptive Statistics for NWP</td>
</tr>
<tr>
<td valign="middle" colspan="2" align="center">Minimum</td>
<td valign="middle" align="center">Maximum</td>
<td valign="middle" align="center">Mean</td>
<td valign="middle" align="center">Std. Deviation</td>
</tr>
<tr>
<td valign="middle" align="center">Method C</td>
<td valign="middle" colspan="2" align="center">8506</td>
<td valign="middle" align="center">36831</td>
<td valign="middle" align="center">19967.040</td>
<td valign="middle" align="center">8425.727</td>
</tr>
<tr>
<td valign="middle" align="center">Method D</td>
<td valign="middle" colspan="2" align="center">73428</td>
<td valign="middle" align="center">194780</td>
<td valign="middle" align="center">139663.16</td>
<td valign="middle" align="center">33567.358</td>
</tr>
<tr>
<td valign="middle" align="center">Method E</td>
<td valign="middle" colspan="2" align="center">41264</td>
<td valign="middle" align="center">214634</td>
<td valign="middle" align="center">96580.960</td>
<td valign="middle" align="center">36276.122</td>
</tr>
<tr>
<td valign="middle" colspan="6" align="center">Pairwise Comparisons of Methods (NWP)</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">
<italic>Sig</italic>
</td>
<td valign="middle" colspan="3" align="center">Method C vs Method D</td>
<td valign="middle" align="center">Method C vs Method E</td>
<td valign="middle" align="center">Method D vs Method E</td>
</tr>
<tr>
<td valign="middle" colspan="3" align="center">&lt;0.001</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.008</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">Methods</td>
<td valign="middle" colspan="5" align="center">Descriptive Statistics for RBP/%</td>
</tr>
<tr>
<td valign="middle" colspan="2" align="center">Minimum</td>
<td valign="middle" align="center">Maximum</td>
<td valign="middle" align="center">Mean</td>
<td valign="middle" align="center">Std. Deviation</td>
</tr>
<tr>
<td valign="middle" align="center">Method C</td>
<td valign="middle" colspan="2" align="center">2.11</td>
<td valign="middle" align="center">9.15</td>
<td valign="middle" align="center">4.959</td>
<td valign="middle" align="center">2.092</td>
</tr>
<tr>
<td valign="middle" align="center">Method D</td>
<td valign="middle" colspan="2" align="center">18.24</td>
<td valign="middle" align="center">48.37</td>
<td valign="middle" align="center">34.684</td>
<td valign="middle" align="center">8.336</td>
</tr>
<tr>
<td valign="middle" align="center">Method E</td>
<td valign="middle" colspan="2" align="center">10.25</td>
<td valign="middle" align="center">53.30</td>
<td valign="middle" align="center">23.9847</td>
<td valign="middle" align="center">9.009</td>
</tr>
<tr>
<td valign="middle" colspan="6" align="center">Pairwise Comparisons of Methods (RBP)</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">
<italic>Sig</italic>
</td>
<td valign="middle" colspan="3" align="center">Method C vs Method D</td>
<td valign="middle" align="center">Method C vs Method E</td>
<td valign="middle" align="center">Method D vs Method E</td>
</tr>
<tr>
<td valign="middle" colspan="3" align="center">&lt;0.001</td>
<td valign="middle" align="center">&lt;0.001</td>
<td valign="middle" align="center">0.008</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>To quantitatively evaluate the extraction performance of the above methods, NWP and RBP were taken as indices to achieve a road extraction performance evaluation of different algorithms, where NRP = 402,668 (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>; <xref ref-type="fig" rid="f8">
<bold>Figures&#xa0;8H, I</bold>
</xref>). To determine the differences in road extraction performance among the three methods, the non-parametric Kruskal-Wallis test was conducted across the three groups using SPSS software version 27 (IBM Corporation). The significance level was set at 0.05. The null hypothesis in this test is that there is no difference between the three methods in terms of the distribution of NWP and RBP. In fact, for this test, the <italic>Sig</italic> values less than 0.05 indicate a significant difference between the groups.</p>
<p>According to the descriptive statistical table of NWP, Method C exhibited a generally low overall level of NWP value (<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8H</bold>
</xref>). Comparing the mean value of NWP across the three methods, it was found that the mean value of NWP for Method C accounted for only 14.3% and 20.67% of the mean value of NWP for Methods D and E, respectively. Furthermore, the maximum and minimum values of NWP for Method C were one order of magnitude smaller than those of Methods D and E. Additionally, the standard deviation of NWP value for Method C was significantly lower than that of Methods D and E, indicating that the road extraction performance of Method C was more stable in the face of variable field interference factors. This observation was also validated in <xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8I</bold>
</xref>, which illustrates that the NWP of Method C exhibits a relatively mild fluctuation in comparison to the other two methods. Moreover, the Kruskal-Wallis test results showed that the NWP values of Methods C and D (<italic>Sig</italic>&lt;0.01), Methods C and E (<italic>Sig</italic>&lt;0.01) and Methods D and E (<italic>Sig</italic> = 0.008)were statistically significant difference. Furthermore, it was confirmed that there were substantial differences in the accuracy of road extraction among the three methods.</p>
<p>Similar results were obtained from the descriptive statistical table of RBP. Method C demonstrated favorable outcomes in terms of the maximum, minimum, mean, and standard deviation of RBP. Thereinto, Method C had an RBP of no more than 9.15%, whereas Method D had an RBP of no more than 48.37%, and Method E had a notably high RBP of 53.30%. The above data suggested that the wrongly identified pixels in the road extraction results of Method C only constituted a small portion of the current image. Compared to the other two methods, Method C was found to deliver better segmentation results for road recognition in the field environment and exhibited greater adaptability to the complex environmental interference factors in the field orchard.</p>
</sec>
<sec id="s4_1_2">
<label>4.1.2</label>
<title>Ablation test</title>
<p>To verify the improvement of the image enhancement algorithm on the overall performance of the road extraction algorithm, an ablation experiment was conducted. The comparative findings for a selection of sample images were illustrated in <xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9</bold>
</xref>, while the comparative results for additional images could be found in the <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. For simplicity, the proposed algorithm without preprocessing was abbreviated as &#x201c;Method F&#x201d;.</p>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>Ablation test results from the proposed preprocessing method. <bold>(A)</bold> Original images. <bold>(B)</bold> Proposed algorithm. <bold>(C)</bold> Proposed algorithm without preprocessing. <bold>(D)</bold> Error area results extracted by proposed algorithm. <bold>(E)</bold> Error area results extracted by proposed algorithm without preprocessing. <bold>(F)</bold> Descriptive Statistics and significance analysis result. <bold>(G)</bold> NWP values of 25 images obtained by methods C and F.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1103276-g009.tif"/>
</fig>
<p>Ablation experiments were conducted on the proposed preprocessing method. The extraction results after pretreatment were shown in <xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9B</bold>
</xref> and the algorithm results without pretreatment were shown in <xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9C</bold>
</xref>. By comparing the two extraction results, the latter extraction results were found to contain a large number of error regions, such as dark grape vines area, grapes, and other objects on the roadside (<xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9E</bold>
</xref>). This phenomenon was confirmed by NWP descriptive statistics (<xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9F</bold>
</xref>).</p>
<p>Based on <xref ref-type="fig" rid="f9">
<bold>Figures&#xa0;9F, G</bold>
</xref>, it can be observed that the majority of segmentation results obtained using Method F had a higher NWP value compared to those obtained using Method C. However, a few image processing results showed an opposite result. The reason for this phenomenon can be attributed to the fact that after image preprocessing, the segmentation result of Method C had more stringent restrictions on green areas, resulting in the removal of a large area of weeds from the road in the segmentation results, thereby increasing the NWP value (4th row of <xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9C</bold>
</xref>).</p>
<p>After image preprocessing, the accuracy of the algorithm was significantly improved at the cost of a small amount of completeness, which reduced the impact of interference regions, such as road shadows, dark fruits, branches, leaves, and gaps in segmentation accuracy. Meanwhile, the Method C also suppressed the interference of noncurrent road areas on the extracted results and significantly reduced the number of misdetected pixels (3th row of <xref ref-type="fig" rid="f9">
<bold>Figures&#xa0;9C, D</bold>
</xref>).</p>
<p>Differences in road extraction performance between the above methods were determined using the non-parametric Mann-Whitney U test. The significance level was set at 0.05. The null hypothesis in this test is that there is no difference between the methods in terms of the distribution of NWP. And the <italic>Sig</italic> values less than 0.05 mean a significant difference between the groups. The Mann-Whitney U test result showed that the NWP values of Methods C and F (<italic>Sig</italic>= 0.03) were statistically significant difference (<xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9F</bold>
</xref>).</p>
<p>In conclusion, image preprocessing played a crucial role in enhancing the accuracy and reliability of road segmentation results.</p>
</sec>
</sec>
<sec id="s4_2">
<label>4.2</label>
<title>Comparison between YOLOv5 and YOLOv7</title>
<p>Target location is an important task in target detection and is normally represented by the coordinate position of the bounding box. The models in this paper used CIoU (<xref ref-type="bibr" rid="B41">Lv et&#xa0;al., 2022</xref>) loss to calculate the boundary frame position loss, which was calculated as follows:</p>
<disp-formula>
<label>(15)</label>    <mml:math display="block" id="M15">
<mml:mrow>
<mml:msub>
<mml:mi>L</mml:mi>
<mml:mrow>
<mml:mi>b</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>I</mml:mi>
<mml:mi>O</mml:mi>
<mml:mi>U</mml:mi>
<mml:mo>+</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msup>
<mml:mi>&#x3c1;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>A</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>B</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:msubsup>
<mml:mi>c</mml:mi>
<mml:mi>d</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:mfrac>
<mml:mo>+</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
<mml:mi>&#x3c5;</mml:mi>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<label>(16)</label>
<mml:math display="block" id="M16">
<mml:mrow>
<mml:mi>&#x3c5;</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>4</mml:mn>
<mml:mrow>
<mml:msup>
<mml:mi>&#x3c0;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfrac>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>arctan</mml:mi>
<mml:mfrac>
<mml:mrow>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mi>g</mml:mi>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mi>g</mml:mi>
</mml:msup>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>arctan</mml:mi>
<mml:mfrac>
<mml:mrow>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mi>p</mml:mi>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mi>p</mml:mi>
</mml:msup>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<label>(17)</label>
<mml:math display="block" id="M17">
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mi>&#x3c5;</mml:mi>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>+</mml:mo>
<mml:mi>I</mml:mi>
<mml:mi>O</mml:mi>
<mml:mi>U</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mi>&#x3c5;</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Where <inline-formula>
<mml:math display="inline" id="im11">
<mml:mrow>
<mml:msup>
<mml:mi>&#x3c1;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>A</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>B</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> is the Euclidean distance of the center points between predicted box and ground truth box, <inline-formula>
<mml:math display="inline" id="im12">
<mml:mrow>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mi>d</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the diagonal distance of the smallest rectangle containing predicted box and ground truth box, <italic>&#x3b1;</italic> is the weight function, and <inline-formula>
<mml:math display="inline" id="im13">
<mml:mi>&#x3c5;</mml:mi>
</mml:math>
</inline-formula> is the function that measures the consistency of the aspect ratio. <inline-formula>
<mml:math display="inline" id="im14">
<mml:mrow>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mi>g</mml:mi>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math display="inline" id="im15">
<mml:mrow>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mi>g</mml:mi>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> are the width and height of the ground truth box, while <inline-formula>
<mml:math display="inline" id="im16">
<mml:mrow>
<mml:msup>
<mml:mi>w</mml:mi>
<mml:mi>p</mml:mi>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula>
<mml:math display="inline" id="im17">
<mml:mrow>
<mml:msup>
<mml:mi>h</mml:mi>
<mml:mi>p</mml:mi>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> are the width and height of the prediction box.</p>
<p>The confidence loss function is used to measure the difference between the confidence score predicted by the model and the actual label. In this paper, the confidence loss function was calculated using a binary cross-entropy loss function (BCELoss, <xref ref-type="bibr" rid="B88">Zhao et&#xa0;al., 2023</xref>), and its formula was as follows:</p>
<disp-formula>
<label>(18)</label>
<mml:math display="block" id="M18">
<mml:mrow>
<mml:msub>
<mml:mi>L</mml:mi>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>f</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>N</mml:mi>
</mml:mfrac>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>n</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>N</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>log</mml:mi>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>log</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Where <inline-formula>
<mml:math display="inline" id="im18">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> denotes the true category, which generally takes the value of 0 or 1, <inline-formula>
<mml:math display="inline" id="im19">
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> denotes the prediction confidence or target probability obtained by the Sigmoid function, and N is the number of positive and negative samples.</p>
<p>After training, the loss function value curves for the training and validation sets of the two YOLO models were obtained, including the loss values of the detection box and detection object (<xref ref-type="fig" rid="f10">
<bold>Figures&#xa0;10A, B</bold>
</xref>). In <xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10A</bold>
</xref>, &#x201c;BOX&#x201d; and &#x201c;Val BOX&#x201d; represented the box loss of the training set and validation set, respectively. In <xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10B</bold>
</xref>, &#x201c;Objectness&#x201d; and &#x201c;Val Objectness&#x201d; represented the confidence loss of the training set and validation set, respectively. As shown in <xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10A, B</bold>
</xref>, it can be observed that the change trend of the loss curves for both models was similar. In particular, it was observed that the values of box and object detection losses for the two YOLO models decreased sharply during training batches 0 to 20, after which the rate of decline slowed down. The sample distribution ratio of model training set and verification set is shown in <xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10D</bold>
</xref>. In addition, the box and the object detection loss values of the YOLOv7 algorithm on the training set were smaller than that of the YOLOv5 algorithm after 150 training epochs. The box detection loss value of YOLOv7 finally stabilized around 0.029 and object detection loss value eventually stabilized around 0.012.</p>
<fig id="f10" position="float">
<label>Figure&#xa0;10</label>
<caption>
<p>Loss curves and detection results of the two YOLO models. <bold>(A)</bold> Box loss value curve of YOLOv5 and YOLOv7 model. <bold>(B)</bold> Confidence loss function value curve of YOLOv7 model. <bold>(C)</bold> Detection results of YOLOv5 and YOLOv 7 on dataset B. <bold>(D)</bold> Training set and verification set introduction.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1103276-g010.tif"/>
</fig>
<p>In addition, although the loss value of box detection in the validation set was slightly higher than that of YOLOv5, the loss value of object detection in the validation set of YOLOv5 showed a trend of fluctuation and rise after 50 training batches. Meanwhile, the loss value of YOLOv7 algorithm decreased steadily and finally the loss value tended to stabilize around 0.0025.</p>
<p>Under the same dataset B, the performance indices of YOLOv7 were better than those of YOLOv5 (<xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10C</bold>
</xref>). The P, R, <italic>mAP</italic>, and F1-scores of YOLOv7 were 88.9, 89.7, 93.4, and 89.3%, respectively, which were 3.1, 2.9, 2.7, and 3% higher than from YOLOv5.</p>
<p>Although the number of YOLOv7 targets detected in some images was less than that of YOLOv5, the overall accuracy of the former was higher than that of the latter (<xref ref-type="fig" rid="f11">
<bold>Figures&#xa0;11A&#x2013;C</bold>
</xref>). Moreover, in global images, YOLOv5 showed the phenomenon of grape cluster misidentification (<xref ref-type="fig" rid="f11">
<bold>Figure&#xa0;11</bold>
</xref>, last row). Algorithm detection confidence was the main evaluation metric in this study. In summary, YOLOv7 was able to better perform the task of detecting clusters of grapes in orchards and, hence,YOLOv7 was used to identify grapes on the roadside.</p>
<fig id="f11" position="float">
<label>Figure&#xa0;11</label>
<caption>
<p>Comparison of partial detection results. <bold>(A)</bold> Original images. <bold>(B)</bold> Identification results of YOLOv5 model. <bold>(C)</bold> Identification results of YOLOv7 model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1103276-g011.tif"/>
</fig>
<p>The confidence level of grape clusters recognition results tested by YOLOv7 on dataset B was mostly above 0.8, while it was mostly above 0.5 on dataset A. There were two reasons for this phenomenon. The first was that the grape clusters were smaller on dataset A than those in the training set and the second that dataset A contained a large number of backgrounds, such as sky, trees, and roads, and the overall complexity of the image far greater than that of the training set.</p>
</sec>
<sec id="s4_3">
<label>4.3</label>
<title>Recognition effects of the synchronous detection algorithm</title>
<p>Furthermore, in order to evaluate the overall detection performance of the synchronous detection algorithm proposed in this paper (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>), simultaneous recognition of the road and roadside fruit was conducted (<xref ref-type="fig" rid="f12">
<bold>Figure&#xa0;12A</bold>
</xref>).</p>
<fig id="f12" position="float">
<label>Figure&#xa0;12</label>
<caption>
<p>Recognition results of overall algorithm and comparison results between proposed algorithm and single YOLOv7 model. <bold>(A)</bold> The overall synchronous detection algorithm recognition results. <bold>(B)</bold> Comparison results of roadside grape clusters identification results between proposed synchronous detection algorithm and single YOLOv7 model. <bold>(C)</bold> Performance comparison between overall synchronous detection algorithm and the single YOLOv7 model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1103276-g012.tif"/>
</fig>
<p>The results demonstrate that the algorithm was able to effectively segment the road area despite the complex outdoor environment, and accurately recognize the grapes on the side of the road. This provides valuable information for the intelligent decision-making and control of the robot during subsequent walking and fruit picking operations, and enhances the robot&#x2019;s ability to identify crucial targets within a complex environment.</p>
<p>Furthermore, the synchronous recognition algorithm demonstrated better effectiveness in roadside grape recognition. To validate the positive impact of image preprocessing and road segmentation in the synchronous recognition algorithm on the recognition performance of road test grapes, the images with and without above aforementioned steps were identified using yolov7 model (<xref ref-type="fig" rid="f12">
<bold>Figure&#xa0;12B</bold>
</xref>). The results revealed that, under identical circumstances, the former approach detected more clusters of grapes on the road side.</p>
<p>To further demonstrate the superiority of the proposed synchronous recognition algorithm in roadside grape detection, 66 images from dataset B were used to detect grape clusters. The number of recognized fruits, recognition time and the promotion ratio (<inline-formula>
<mml:math display="inline" id="im20">
<mml:mrow>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>r</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>) were taken as evaluation parameters. The <inline-formula>
<mml:math display="inline" id="im21">
<mml:mrow>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>r</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> was calculated by the following formula.</p>
<disp-formula>
<label>(19)</label>
<mml:math display="block" id="M19">
<mml:mrow>
<mml:msub>
<mml:mi>P</mml:mi>
<mml:mi>r</mml:mi>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>w</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Here, <inline-formula>
<mml:math display="inline" id="im22">
<mml:mrow>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>w</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represents the evaluation parameters obtained through image calculation based on image preprocessing and road segmentation, while <inline-formula>
<mml:math display="inline" id="im23">
<mml:mrow>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> represents the evaluation parameters obtained without image preprocessing and road segmentation.</p>
<p>The number of recognized grape clusters in the former was 41 more than that in the latter, representing a 23.84% increase. Additionally, the recognition speed of the former was 0.267 seconds faster than that of the latter, resulting in a speed increase of 14.33%. The results indicated that the images with pre-processing and road segmentation were able to identify more grape clusters and at a faster detection speed compared to the images without pre-processing and road segmentation (refer to <xref ref-type="fig" rid="f12">
<bold>Figure&#xa0;12C</bold>
</xref>). This finding provided evidence that the synchronous recognition algorithm proposed in this paper outperforms using YOLOv7 alone for identifying roadside grapes under the same scenario.</p>
<p>The reasons for the above phenomena were as follows: First, due to the extraction and preprocessing of the ROI in the overall algorithm, a large number of backgrounds, such as sky and trees, were eliminated, which improved the proportion of grape cluster pixels in the whole image. In addition, after extracting the road in the image, the interference of the road area on fruit cluster recognition was reduced and grape features more pronounced, which was beneficial for detecting fruit clusters on the roadside.</p>
</sec>
<sec id="s4_4" sec-type="discussion">
<label>4.4</label>
<title>Discussion</title>
<p>Although the unstructured road extraction and roadside fruit synchronous recognition algorithm proposed in this study had good performance, it also had some limitations (<xref ref-type="fig" rid="f13">
<bold>Figures 13A&#x2013;C</bold>
</xref>). First, it was difficult to distinguish the adhesive road areas between different rows during road extraction. For example, when the death of grape plants leads to a large area of vacancy on the road side, the road regions of images consisted of two parts: the road part of the robot&#x2019;s current row and road part of the non-current row (<xref ref-type="fig" rid="f13">
<bold>Figure&#xa0;13C</bold>
</xref>). In this case, it was difficult for the proposed algorithm to distinguish the correct region from the wrong one. At the same time, when there were a large area of weeds near the end of the road with a width of more than 1/2 of the width of the road, the completeness of the extracted results was reduced. Future research will consider optimization algorithms and add constraints to improve result accuracy.</p>
<fig id="f13" position="float">
<label>Figure&#xa0;13</label>
<caption>
<p>Adverse Conditions. <bold>(A)</bold> Original image. <bold>(B)</bold> Result of road extraction. <bold>(C)</bold> Analysis of adverse factors.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1103276-g013.tif"/>
</fig>
<p>In addition, in the process of roadside fruit string identification, there was still a situation of missing grape-cluster detection. Future research will further optimize and improve the network structure for the problems of missing fruit string detection and low confidence of some detection target results.</p>
</sec>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusions</title>
<p>In this study, an algorithm for unstructured road extraction and roadside fruit synchronous recognition in a complex orchard environment was developed to address the above issues. The main conclusions could be obtained as follows:</p>
<list list-type="simple">
<list-item>
<p>(1) An unstructured road extraction and roadside fruit synchronous recognition framework was constructed for achieving simultaneous road extraction and roadside fruit detection, which effectively improved the ability of fruit picking robots to extract key information from the picking environment. The algorithm also provided information for decision-making and reasoning of collaborative behavior of key parts of the robot, which improved the adaptability of the robot to randomly distributed fruit.</p>
</list-item>
<list-item>
<p>(2) Based on the analysis of the orchard images, an image enhancement preprocessing method was proposed to reduce the interference of road shadows, dark fruits, branches, and leaves as well as gaps in segmentation results. The method also suppressed the influence of noncurrent road areas on extraction results to a certain extent, which improved result accuracy and reliability.</p>
</list-item>
<list-item>
<p>(3) By enhancing the color channel and optimizing the grayscale factor, the dual spatial fusion road extraction was achieved. Experimental results showed that, compared with the extraction method based on S component and Otsu and extraction method based on EXG and Otsu, the proposed algorithm showed greater adaptability to adverse conditions, such as uneven illumination and road shadows under the background of complex orchards. The proposed road extraction algorithm also largely avoided the problems of missing extraction of real road areas and identification of large area errors, which had the best segmentation effect.</p>
</list-item>
<list-item>
<p>(4) The YOLOv7 and YOLOv5 algorithms, optimized with grape cluster target data, were used to identify roadside grape clusters. The optimized YOLOv7 model achieved a precision of 88.9%, recall of 89.7%, mAP of 93.4%, and F1-score of 89.3%, all of which were higher than those obtained from the YOLOv5 model. Based on this comparison, the YOLOv7 with optimized parameters was found to be more suitable for roadside grape recognition in wide-field views.</p>
</list-item>
<list-item>
<p>(5) The proposed fusion algorithm took the road extraction results as input and then identified fruit strings on the road side. The performance of the proposed fusion algorithm was superior to only using the YOLOv7 model. Compared with the single YOLOv7 model, the number of grape string detections and detection speed of the fusion algorithm were increased by 23.84% and 14.33%.</p>
</list-item>
</list>
<p>Although the new algorithm has achieved satisfactory results, there remains some room for progress. First, due to the similarity between different lines of the roads, the algorithm in this case had difficulty in segmenting the cohesive road area between different lines. At the same time, the completeness of the extraction results was reduced when there were a large area of weeds with a width ratio of 1/2 near the end of the road.</p>
<p>Future work will focus on network structure optimization to improve the accuracy and speed of road extraction and roadside fruit detection algorithms. Constraints between road zones will also been studied to enable the identification and segmentation of road zones between different lines. Furthermore, environment-aware robot behavioral decision control systems will be developed to enable collaborative decision planning and response control of picking and walking operations in complex orchard environments.</p>
</sec>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. Further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>XJZ designed the experiments. WT and ZY carried out the experiments. XZZ designed the study, analyzed the data, and wrote the manuscript. HM and XL supervised and revised the manuscript. All authors contributed to the article and approved the submitted version.</p>
</sec>
</body>
<back>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>This study was supported by the scientific and technological breakthrough plan in key fields of Xinjiang Production and Construction Corps, China (Approval No.2022DB004), Foshan Science and Technology Innovation Project, China (Approval No.2120001008424) and Guangdong Basic and Applied Basic Research Foundation (Approval No.2022A1515140162 and No.2022A1515140013).</p>
</sec>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2023.1103276/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2023.1103276/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="DataSheet_2.zip" id="SM2" mimetype="application/zip"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Aamir</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Bazai</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Wagan</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Bhatti</surname> <given-names>U. A.</given-names>
</name>
<name>
<surname>Nizamani</surname> <given-names>M. M.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Spatiotemporal change of air-quality patterns in hubei province-a pre- to post-COVID-19 analysis using path analysis and regression</article-title>. <source>ATMOSPHERE</source> <volume>12</volume> (<issue>10</issue>), <elocation-id>1338</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/atmos12101338</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alam</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Singh</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Jaffery</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Verma</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Diwakar</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Distance-based confidence generation and aggregation of classifier for unstructured road detection</article-title>. <source>J. King Saud Univ. - Comput. Inf. Sci</source> <volume>34</volume> (10, Part A), <fpage>8727</fpage>&#x2013;<lpage>8738</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jksuci.2021.09.020</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bhatti</surname> <given-names>U. A.</given-names>
</name>
<name>
<surname>Nizamani</surname> <given-names>M. M.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>M. X.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Climate change threatens pakistan&#x2019;s snow leopards</article-title>. <source>Science</source> <volume>377</volume> (<issue>6606</issue>), <fpage>585</fpage>&#x2013;<lpage>586</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.add9065</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bhatti</surname> <given-names>U. A.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Bazai</surname> <given-names>S. U.</given-names>
</name>
<name>
<surname>Nawaz</surname> <given-names>S. A.</given-names>
</name>
<name>
<surname>Baryalai</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Bhatti</surname> <given-names>M. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>a). <article-title>A pre- to post-COVID-19 change of air quality patterns in anhui province using path analysis and regression</article-title>. <source>Polish J. Of Environ. Stud.</source> <volume>31</volume> (<issue>5</issue>), <fpage>4029</fpage>&#x2013;<lpage>4042</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.15244/pjoes/148065</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bhatti</surname> <given-names>U. A.</given-names>
</name>
<name>
<surname>Zeeshan</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Nizamani</surname> <given-names>M. M.</given-names>
</name>
<name>
<surname>Bazai</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2022</year>b). <article-title>Assessing the change of ambient air quality patterns in jiangsu province of China pre-to post-COVID-19</article-title>. <source>Chemosphere</source> <volume>288</volume>, <elocation-id>132569</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.chemosphere.2021.132569</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Camizuli</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Carranza</surname> <given-names>E. J.</given-names>
</name>
</person-group> (<year>2018</year>). &#x201c;<article-title>Exploratory data analysis (EDA)</article-title>,&#x201d; in <source>The encyclopedia of archaeological sciences</source>. Ed. <person-group person-group-type="editor">
<name>
<surname>L&#xf3;pez Varela</surname> <given-names>S. L.</given-names>
</name>
</person-group> (<publisher-name>John Wiley &amp; Sons Inc</publisher-name>), <fpage>1</fpage>&#x2013;<lpage>7</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/9781119188230.saseas0271</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Qiang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Navigation path extraction for greenhouse cucumber-picking robots using the prediction-point hough transform</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>180</volume>, <elocation-id>105911</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2020.105911</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Qiang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>X.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Extracting the navigation path of a tomato-cucumber greenhouse robot based on a median point hough transform</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>174</volume>, <elocation-id>105472</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2020.105472</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Qiu</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>GA-net: a geometry prior assisted neural network for road extraction</article-title>. <source>Int. J. Appl. Earth Observation Geoinformation.</source> <volume>114</volume>, <elocation-id>103004</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jag.2022.103004</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zou</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>H.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Three-dimensional perception of orchard banana central stock enhanced by adaptive multi-vision technology</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>174</volume>, <elocation-id>105508</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2020.105508</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Meng</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Qi</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Wei</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Single-target detection of oncomelania hupensis based on improved YOLOv5s</article-title>. <source>Front. Bioeng. Biotechnol.</source> <volume>10</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fbioe.2022.861079</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feng</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Miao</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A vegetable leaf disease identification model based on image-text cross-modal feature fusion</article-title>. <source>Front. In Plant Sci.</source> <volume>13</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2022.918940</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fu</surname> <given-names>L. H.</given-names>
</name>
<name>
<surname>Duan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zou</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Fast and accurate detection of banana fruits in complex background orchards</article-title>. <source>IEEE Access.</source> <volume>8</volume>, <fpage>196835</fpage>&#x2013;<lpage>196846</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/ACCESS.2020.3029215</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Majeed</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Karkee</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Q.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Faster r-CNN-based apple detection in dense-foliage fruiting-wall trees using RGB and depth features for robotic harvesting</article-title>. <source>Biosyst. Engineering.</source> <volume>197</volume>, <fpage>245</fpage>&#x2013;<lpage>256</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.biosystemseng.2020.07.007</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Zou</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Z.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Fast detection of banana bunches and stalks in the natural environment based on deep learning</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>194</volume>, <elocation-id>106800</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.106800</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Galvan</surname> <given-names>L. P. C.</given-names>
</name>
<name>
<surname>Bhatti</surname> <given-names>U. A.</given-names>
</name>
<name>
<surname>Campo</surname> <given-names>C. C.</given-names>
</name>
<name>
<surname>Trujillo</surname> <given-names>R. A. S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>The nexus between CO2 emission, economic growth, trade openness: evidences from middle-income trap countries</article-title>. <source>Front. In Environ. Sci.</source> <volume>10</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fenvs.2022.938776</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ge</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Xiong</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>From</surname> <given-names>P. J.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Three-dimensional location methods for the vision system of strawberry-harvesting robots: development and comparison</article-title>. <source>Precis. Agric</source> <volume>24</volume> (<issue>2</issue>), <fpage>764</fpage>&#x2013;<lpage>782</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11119-022-09974-4</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guan</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Lei</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Marcato</surname> <given-names>J.</given-names>
<suffix>Jr.</suffix>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Road marking extraction in UAV imagery using attentive capsule feature pyramid network</article-title>. <source>Int. J. Appl. Earth Observation Geoinformation.</source> <volume>107</volume>, <elocation-id>102677</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jag.2022.102677</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Zou</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Xiong</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Color feature analysis and recognition for litchi fruits and their main fruit bearing branch based on exploratory analysis</article-title>. <source>Trans. Chin. Soc. Agric. Engineering.</source> <volume>29</volume> (<issue>4</issue>), <fpage>191</fpage>&#x2013;<lpage>198</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3969/j.issn.1002-6819.2013.04.024</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gupta</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Tiwari</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Color retinal image enhancement using luminosity and quantile based contrast enhancement</article-title>. <source>Multidimensional Syst. Signal Processing.</source> <volume>30</volume> (<issue>4</issue>), <fpage>1829</fpage>&#x2013;<lpage>1837</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11045-019-00630-1</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>He</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J.-B.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>L.-L.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>An improved fractional-order differentiation model for image denoising</article-title>. <source>Signal Processing.</source> <volume>112</volume>, <fpage>180</fpage>&#x2013;<lpage>188</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.sigpro.2014.08.025</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Deep unsupervised endoscopic image enhancement based on multi-image fusion</article-title>. <source>Comput. Methods Programs Biomedicine.</source> <volume>221</volume>, <elocation-id>106800</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cmpb.2022.106800</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jia</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Wei</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Pan</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Niu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Yin</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Accurate segmentation of green fruit based on optimized mask RCNN application in complex orchard</article-title>. <source>Front. Plant Sci.</source> <volume>13</volume>, <elocation-id>955256</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2022.955256</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jintasuttisak</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Edirisinghe</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Elbattay</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Deep neural network based date palm tree detection in drone imagery</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>192</volume>, <elocation-id>106560</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2021.106560</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jobson</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Rahman</surname> <given-names>Z. U.</given-names>
</name>
<name>
<surname>Woodell</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>A multi - scale retinex for bridging the gap between color images and the human observation of scenes</article-title>. <source>Image Processing IEEE Trans. on.</source> <volume>6</volume>, <fpage>965</fpage>&#x2013;<lpage>976</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/83.597272</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Au</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Geometry-aware fruit grasping estimation for robotic harvesting in apple orchards</article-title>. <source>Comput. Electron. Agric.</source> <volume>193</volume>, <elocation-id>106716</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.106716</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khaki</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Crop yield prediction using deep neural networks</article-title>. <source>Front. Plant Sci.</source> <volume>10</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2019.00621</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>W.-S.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>D.-H.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>Y.-J.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Hwang</surname> <given-names>R.-Y.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>H.-J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Path detection for autonomous traveling in orchards using patch-based CNN</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>175</volume>, <elocation-id>105620</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2020.105620</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lei</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Yao</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Detection and modeling of unstructured roads in forest areas based on visual-2D lidar data fusion</article-title>. <source>Forests</source> <volume>12</volume>, <elocation-id>820</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/f12070820</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Y. J.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>Q. C.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Xiong</surname> <given-names>Z. C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Advance of target visual information acquisition technology for fresh fruit robotic harvesting: a review</article-title>. <source>Agronomy-Basel</source> <volume>12</volume> (<issue>6</issue>), <elocation-id>1336</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/agronomy12061336</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Fu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Fang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>F.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Multi-class detection of kiwifruit flower and its distribution identification in orchard based on YOLOv5l and euclidean distance</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>201</volume>, <elocation-id>107342</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.107342</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Hong</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Gong</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A SVM and SLIC based detection method for paddy field boundary line</article-title>. <source>Sensors</source> <volume>20</volume> (<issue>9</issue>), <elocation-id>2610</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/s20092610</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Qiao and L. Zhang</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A multi-scale cucumber disease detection method in natural scenes based on YOLOv5</article-title>. <source>Comput. And Electron. In Agric.</source> <volume>202</volume>, <fpage>107363</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.107363</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Tong</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Ding</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Road extraction algorithm based on intrinsic image and vanishing point for unstructured road image</article-title>. <source>Robotics Autonomous Systems.</source> <volume>109</volume>, <fpage>86</fpage>&#x2013;<lpage>96</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.robot.2018.08.011</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Qin</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Impact of epidemic-affected labor shortage on food safety: a Chinese scenario analysis using the CGE model</article-title>. <source>FOODS</source> <volume>10</volume> (<issue>11</issue>), <elocation-id>2679</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/foods10112679</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liao</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Babiker</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>W.-f.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Dandelion segmentation with background transfer learning and RGB-attention module</article-title>. <source>Comput. Electron. Agric.</source> <volume>202</volume>, <elocation-id>107355</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.107355</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Qi</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Pan</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Sharp</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>COVID-19 pandemic, technological progress and food security based on a dynamic CGE model</article-title>. <source>Sustainability</source> <volume>14</volume> (<issue>3</issue>), <elocation-id>1842</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/su14031842</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zou</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Collision-free path planning for a guava-harvesting robot based on recurrent deep reinforcement learning</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>188</volume>, <elocation-id>106350</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2021.106350</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Dobaie</surname> <given-names>A. M.</given-names>
</name>
<name>
<surname>Zhuang</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Autonomous road detection and modeling for UGVs using vision-laser data fusion</article-title>. <source>Neurocomputing</source> <volume>275</volume>, <fpage>2752</fpage>&#x2013;<lpage>2761</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.neucom.2017.11.042</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Noise suppression of the reconstruction of infrared digital holography based on pyramid-based bilateral filter</article-title>. <source>Infrared Phys. Technol.</source> <volume>85</volume>, <fpage>352</fpage>&#x2013;<lpage>358</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.infrared.2017.07.023</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lv</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Han</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Rong</surname> <given-names>H.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>A visual identification method for the apple growth forms in the orchard</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>197</volume>, <elocation-id>106954</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.106954</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lyu</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Fan</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Green citrus detection and counting in orchards based on YOLOv5-CS and AI edge system</article-title>. <source>Sensors</source> <volume>22</volume>, <elocation-id>576</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/s22020576</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ma</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Qureshi</surname> <given-names>W. S.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Autonomous navigation for a wolfberry picking robot using visual cues and fuzzy control</article-title>. <source>Inf. Process. Agriculture.</source> <volume>8</volume> (<issue>1</issue>), <fpage>15</fpage>&#x2013;<lpage>26</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.inpa.2020.04.005</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Meyer</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Hindman</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Laksmi</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>Machine vision detection parameters for plant species identification</article-title>. <source>Proc. SPIE - Int. Soc. Optical Eng.</source> <volume>3543</volume>, <fpage>327</fpage>&#x2013;<lpage>335</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1117/12.336896</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nawaz</surname> <given-names>S. A.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J. B.</given-names>
</name>
<name>
<surname>Bhatti</surname> <given-names>U. A.</given-names>
</name>
<name>
<surname>Bazai</surname> <given-names>S. U.</given-names>
</name>
<name>
<surname>Zafar</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Bhatti</surname> <given-names>M. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>A hybrid approach to forecast the COVID-19 epidemic trend</article-title>. <source>PloS One</source> <volume>16</volume> (<issue>10</issue>), <elocation-id>e0256971</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0256971</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ning</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Ding</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Dong</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Recognition of sweet peppers and planning the robotic picking sequence in high-density orchards</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>196</volume>, <elocation-id>106878</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.106878</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peng</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Zou</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Xiong</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Color model analysis and Recognition for parts of citrus based on exploratory data analysis</article-title>. <source>Trans. Chin. Soc. Agric. Machinery</source> <volume>44</volume> (<issue>S1</issue>), <fpage>253</fpage>&#x2013;<lpage>259</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.6041/j.issn.1000-1298.2013.S1.045</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Phung</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Le</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Bouzerdoum</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Pedestrian lane detection in unstructured scenes for assistive navigation</article-title>. <source>Comput. Vision Image Understanding.</source> <volume>149</volume>, <fpage>186</fpage>&#x2013;<lpage>196</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cviu.2016.01.011</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qi</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>An improved YOLOv5 model based on visual attention mechanism: application to recognition of tomato virus disease</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>194</volume>, <elocation-id>106780</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.106780</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qi</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Chuanxiang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>R.</given-names>
</name>
<name>
<surname>He</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Unstructured road detection <italic>via</italic> combining the model-based and feature-based methods</article-title>. <source>IET Intelligent Transport Syst.</source> <volume>13</volume>, <fpage>1533</fpage>&#x2013;<lpage>1544</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1049/iet-its.2018.5576</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rong</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Fruit pose recognition and directional orderly grasping strategies for tomato harvesting robots</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>202</volume>, <elocation-id>107430</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.107430</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Routray</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Malla</surname> <given-names>P. P.</given-names>
</name>
<name>
<surname>Sharma</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Panda</surname> <given-names>S. K.</given-names>
</name>
<name>
<surname>Palai</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A new image denoising framework using bilateral filtering based non-subsampled shearlet transform</article-title>. <source>Optik</source> <volume>216</volume>, <elocation-id>164903</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ijleo.2020.164903</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rysz</surname> <given-names>M. W.</given-names>
</name>
<name>
<surname>Mehta</surname> <given-names>S. S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>A risk-averse optimization approach to human-robot collaboration in robotic fruit harvesting</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>182</volume>, <elocation-id>106018</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2021.106018</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Safarik</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Baldikova</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Prochazkova</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Pospiskova</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Smartphone-based image analysis for evaluation of magnetic textile solid phase extraction of colored compounds</article-title>. <source>Heliyon</source> <volume>5</volume> (<issue>12</issue>), <elocation-id>e02995</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.heliyon.2019.e02995</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>She</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhan</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Hong</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Min</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Dong</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>H.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>A method for automatic real-time detection and counting of fruit fly pests in orchards by trap bottles <italic>via</italic> convolutional neural network with attention mechanism added</article-title>. <source>Ecol. Informatics.</source> <volume>70</volume>, <elocation-id>101690</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ecoinf.2022.101690</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Singh</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A neutrosophic-entropy based clustering algorithm (NEBCA) with HSV color system: a special application in segmentation of parkinson&#x2019;s disease (PD) MR images</article-title>. <source>Comput. Methods Programs Biomedicine.</source> <volume>189</volume>, <elocation-id>105317</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cmpb.2020.105317</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Su</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Alvarez</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Kong</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>An illumination-invariant nonparametric model for urban road detection</article-title>. <source>IEEE Trans. Intell. Veh.</source> <volume>4</volume> (<issue>1</issue>), <fpage>14</fpage>&#x2013;<lpage>23</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/TIV.2018.2886689</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Semantic segmentation and path planning for orchards based on UAV images</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>200</volume>, <elocation-id>107222</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.107222</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Leite</surname> <given-names>A. C.</given-names>
</name>
<name>
<surname>Xiong</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2023</year>a). <article-title>Editorial: precision control technology and application in agricultural pest and disease control</article-title>. <source>Front. Plant Sci.</source> <volume>14</volume>, <elocation-id>1163839</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2023.1163839</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Lian</surname> <given-names>G.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Recognition and localization methods for vision-based fruit picking robots: a review</article-title>. <source>Front. Plant Science.</source> <volume>11</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2020.00510</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Qiu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>K.</given-names>
</name>
<etal/>
</person-group>. (<year>2023</year>b). <article-title>Optimization strategies of fruit detection to overcome the challenge of unstructured background in field orchard environment: a review</article-title>. <source>Precis. Agric</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11119-023-10009-9</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2023</year>c). <article-title>Fruit detection and positioning technology for a camellia oleifera c. Abel orchard based on improved YOLOv4-tiny model and binocular stereo vision</article-title>. <source>Expert Syst. WITH APPLICATIONS.</source> <volume>211</volume>, <elocation-id>118573</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.eswa.2022.118573</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>C.-Y.</given-names>
</name>
<name>
<surname>Bochkovskiy</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Liao</surname> <given-names>H.-y.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>YOLOv7: trainable bag-of-freebies sets new state-of-the-art for real-time object detectors</article-title>. <source>Arxiv</source> doi:&#xa0;<pub-id pub-id-type="doi">10.48550/arXiv.2207.02696</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>W. S.</given-names>
</name>
<name>
<surname>Zou</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Choi</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Gan</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Diamond</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Detection and counting of immature green citrus fruit based on the local binary patterns (LBP) feature using illumination-normalized images</article-title>. <source>Precis. Agric.</source> <volume>19</volume>, <fpage>1062</fpage>&#x2013;<lpage>1083</lpage> doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11119-018-9574-5</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Huashuai</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Fang</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Road detection based on illuminant invariance and quadratic estimation</article-title>. <source>Optik</source> <volume>185</volume>, <fpage>672</fpage>&#x2013;<lpage>684</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ijleo.2019.04.026</pub-id>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Song</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Rapid citrus harvesting motion planning with pre-harvesting point and quad-tree</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>202</volume>, <elocation-id>107348</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.107348</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zou</surname> <given-names>X.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Window zooming&#x2013;based localization algorithm of fruit and vegetable for harvesting robot</article-title>. <source>IEEE Access.</source> <volume>7</volume>, <fpage>103639</fpage>&#x2013;<lpage>103649</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/ACCESS.2019.2925812</pub-id>
</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Lv</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Low illumination color image enhancement based on gabor filtering and retinex theory</article-title>. <source>Multimedia Tools Applications.</source> <volume>80</volume> (<issue>12</issue>), <fpage>17705</fpage>&#x2013;<lpage>17719</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11042-021-10607-7</pub-id>
</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Lv</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>G.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Field rice panicle detection and counting based on deep learning</article-title>. <source>Front. Plant Sci.</source> <volume>13</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2022.966495</pub-id>
</citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Fast detection of cannibalism behavior of juvenile fish based on deep learning</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>198</volume>, <elocation-id>107033</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.107033</pub-id>
</citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Woebbecke</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Meyer</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Bargen</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Mortensen</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>Plant species identification, size, and enumeration using machine vision techniques on near-binary images</article-title>. <source>SPIE Optics Agric. Forestry</source> <volume>1836</volume>, <fpage>208</fpage>&#x2013;<lpage>219</lpage>. doi: <pub-id pub-id-type="doi">10.1117/12.144030</pub-id>
</citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Woebbecke</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Meyer</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Bargen</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Mortensen</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Color indices for weed identification under various soil, residue, and lighting conditions</article-title>. <source>Trans. ASAE.</source> <volume>38</volume>, <fpage>259</fpage>&#x2013;<lpage>269</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.13031/2013.27838</pub-id>
</citation>
</ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Duan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Ai</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Zou</surname> <given-names>X.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Rachis detection and three-dimensional localization of cut off point for vision-based banana robot</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>198</volume>, <elocation-id>107079</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.107079</pub-id>
</citation>
</ref>
<ref id="B74">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>F. Y.</given-names>
</name>
<name>
<surname>Duan</surname> <given-names>J. L.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>S. Y.</given-names>
</name>
<name>
<surname>Ye</surname> <given-names>Y. X.</given-names>
</name>
<name>
<surname>Ai</surname> <given-names>P. Y.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Multi-target recognition of bananas and automatic positioning for the inflorescence axis cutting point</article-title>. <source>Front. In Plant Sci.</source> <volume>12</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2021.705021</pub-id>
</citation>
</ref>
<ref id="B75">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Fu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Coefficient of restitution of kiwifruit without external interference</article-title>. <source>J. Food Engineering.</source> <volume>327</volume>, <elocation-id>111060</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jfoodeng.2022.111060</pub-id>
</citation>
</ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xin</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Fang</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Road extraction of high-resolution remote sensing images derived from DenseUNet</article-title>. <source>Remote Sens.</source> <volume>11</volume> (<issue>21</issue>), <elocation-id>2499</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs11212499</pub-id>
</citation>
</ref>
<ref id="B77">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Xia</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Sehdev</surname> <given-names>P.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>An illumination robust road detection method based on color names and geometric information</article-title>. <source>Cogn. Syst. Res.</source> <volume>52</volume>, <fpage>240</fpage>&#x2013;<lpage>250</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cogsys.2018.06.019</pub-id>
</citation>
</ref>
<ref id="B78">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Xie</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Kang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>P.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Design of an efficient combined multipoint picking scheme for tea buds</article-title>. <source>Front. Plant Sci.</source> <volume>13</volume>, <elocation-id>1042035</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2022.1042035</pub-id>
</citation>
</ref>
<ref id="B79">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Review of smart robots for fruit and vegetable picking in agriculture</article-title>. <source>Int. J. Agric. Biol. Engineering.</source> <volume>14</volume>, <fpage>33</fpage>&#x2013;<lpage>54</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.25165/j.ijabe.20221501.7232</pub-id>
</citation>
</ref>
<ref id="B80">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Ouyang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Duan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Visual navigation path extraction of orchard hard pavement based on scanning method and neural network</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>197</volume>, <elocation-id>106964</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.106964</pub-id>
</citation>
</ref>
<ref id="B81">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>SDUNet: road extraction <italic>via</italic> spatial enhanced and densely connected UNet</article-title>. <source>Pattern Recognit.</source> <volume>126</volume>, <elocation-id>108549</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.patcog.2022.108549</pub-id>
</citation>
</ref>
<ref id="B82">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ye</surname> <given-names>C.-w.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>Z.-w.</given-names>
</name>
<name>
<surname>Kang</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Yousaf</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Qi</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>K.-j.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>An experimental study of stunned state detection for broiler chickens using an improved convolution neural network algorithm</article-title>. <source>Comput. Electron. Agric.</source> <volume>170</volume>, <elocation-id>105284</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2020.105284</pub-id>
</citation>
</ref>
<ref id="B83">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Ru</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>Q.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Detection method of wheat spike improved YOLOv5s based on the attention mechanism</article-title>. <source>Front. Plant Sci.</source> <volume>13</volume>, <elocation-id>993244</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2022.993244</pub-id>
</citation>
</ref>
<ref id="B84">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>YOLO5-spear: a robust and real-time spear tips locator by improving image augmentation and lightweight network for selective harvesting robot of white asparagus</article-title>. <source>Biosyst. Engineering.</source> <volume>218</volume>, <fpage>43</fpage>&#x2013;<lpage>61</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.biosystemseng.2022.04.006</pub-id>
</citation>
</ref>
<ref id="B85">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Qiao</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>He</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Deep learning based automatic grape downy mildew detection</article-title>. <source>Front. Plant Sci.</source> <volume>13</volume>, <elocation-id>872107</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2022.872107</pub-id>
</citation>
</ref>
<ref id="B86">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Research on multi-image and multi-parameter fusion algorithm based on detail restoration</article-title>. <source>Multimedia Tools Applications.</source> <volume>81</volume> (<issue>12</issue>), <fpage>16589</fpage>&#x2013;<lpage>16600</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11042-022-12682-w</pub-id>
</citation>
</ref>
<ref id="B87">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>Z. Q.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Yin</surname> <given-names>Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Cut-edge detection method for wheat harvesting based on stereo vision</article-title>. <source>Comput. Electron. Agriculture.</source> <volume>197</volume>, <elocation-id>106910</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2022.106910</pub-id>
</citation>
</ref>
<ref id="B88">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Precision detection of crop diseases based on improved YOLOv5 model</article-title>. <source>Front. Plant Sci.</source> <volume>13</volume>, <elocation-id>1066835</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2022.1066835</pub-id>
</citation>
</ref>
<ref id="B89">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zou</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Meng</surname> <given-names>F.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Adaptive active positioning of camellia oleifera fruit picking points: classical image processing and YOLOv7 fusion algorithm</article-title>. <source>Appl. Sci.</source> <volume>12</volume> (<issue>24</issue>), <elocation-id>12959</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/app122412959</pub-id>
</citation>
</ref>
<ref id="B90">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Xia</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Design and experiment of visual navigated UGV for orchard based on hough matrix and RANSAC</article-title>. <source>Int. J. Agric. Biol. Engineering.</source> <volume>14</volume>, <fpage>176</fpage>&#x2013;<lpage>184</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.25165/j.ijabe.20211406.5953</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>