<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="methods-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2023.1258521</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Methods</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Total and component forest aboveground biomass inversion via LiDAR-derived features and machine learning algorithms</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Ma</surname>
<given-names>Jiamin</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2365036"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Wangfei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Ji</surname>
<given-names>Yongjie</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Huang</surname>
<given-names>Jimao</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Huang</surname>
<given-names>Guoran</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Lu</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>College of Forestry, Southwest Forestry University</institution>, <addr-line>Kunming</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>College of Geography and Ecotourism, Southwest Forestry University</institution>, <addr-line>Kunming</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Aisino Xinde Zhitu (Beijing) Technology Co</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Dzarifah Zulperi, Universiti Putra Malaysia, Malaysia</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Luigi Saulino, University of Naples Federico II, Italy; Akhouri Pramod Krishna, Birla Institute of Technology, Mesra, India</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Yongjie Ji, <email xlink:href="mailto:jiyongjie@live.cn">jiyongjie@live.cn</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>26</day>
<month>10</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>14</volume>
<elocation-id>1258521</elocation-id>
<history>
<date date-type="received">
<day>17</day>
<month>07</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>02</day>
<month>10</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Ma, Zhang, Ji, Huang, Huang and Wang</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Ma, Zhang, Ji, Huang, Huang and Wang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Forest aboveground biomass (AGB) and its biomass components are key indicators for assessing forest ecosystem health, productivity, and carbon stocks. Light Detection and Ranging (LiDAR) technology has great advantages in acquiring the vertical structure of forests and the spatial distribution characteristics of vegetation. In this study, the 56 features extracted from airborne LiDAR point cloud data were used to estimate forest total and component AGB. Variable importance&#x2013;in&#x2013;projection values calculated through a partial least squares regression algorithm were utilized for LiDAR-derived feature ranking and optimization. Both leave-one-out cross-validation (LOOCV) and cross-validation methods were applied for validation of the estimated results. The results showed that four cumulative height percentiles (<italic>AIH</italic>
<sub>30,</sub> <italic>AIH</italic>
<sub>40</sub>, <italic>AIH</italic>
<sub>20</sub>, and <italic>AIH</italic>
<sub>25</sub>), two height percentiles (<italic>H</italic>
<sub>8</sub> and <italic>H</italic>
<sub>6</sub>), and four height-related variables (<italic>H</italic>
<sub>mean</sub>, <italic>H</italic>
<sub>sqrt</sub>, <italic>H</italic>
<sub>mad</sub>, and <italic>H</italic>
<sub>curt</sub>) are ranked more frequently in the top 10 sensitive features for total and component forest AGB retrievals. Best performance was acquired by random forest (RF) algorithm, with <italic>R</italic>
<sup>2&#xa0;=&#xa0;</sup>0.75, root mean square error (RMSE) = 22.93 Mg/ha, relative RMSE (rRMSE) = 25.30%, and mean absolute error (MAE) = 19.26 Mg/ha validated by the LOOCV method. For cross-validation results, <italic>R</italic>
<sup>2</sup> is 0.67, RMSE is 24.56 Mg/ha, and rRMSE is 25.67%. The performance of support vector regression (SVR) for total AGB estimation is <italic>R</italic>
<sup>2&#xa0;=&#xa0;</sup>0.66, RMSE = 26.75 Mg/ha, rRMSE = 28.62%, and MAE = 22.00 Mg/ha using LOOCV validation and <italic>R</italic>
<sup>2&#xa0;=&#xa0;</sup>0.56, RMSE = 30.88 Mg/ha, and rRMSE = 31.41% by cross-validation. For the component AGB estimation, the accuracy from both RF and SVR algorithms was arranged as stem &gt; bark &gt; branch &gt; leaf. The results confirmed the sensitivity of LiDAR-derived features to forest total and component AGBs. They also demonstrated the worse performance of these features for retrieval of leaf component AGB. RF outperformed SVR for both total and component AGB estimation, the validation difference from LOOCV and cross-validation is less than 5% for both total and component AGB estimated results.</p>
</abstract>
<kwd-group>
<kwd>forest total and component AGB</kwd>
<kwd>machine learning</kwd>
<kwd>LiDAR</kwd>
<kwd>validation methods</kwd>
<kwd>random forest</kwd>
</kwd-group>
<counts>
<fig-count count="13"/>
<table-count count="7"/>
<equation-count count="5"/>
<ref-count count="52"/>
<page-count count="17"/>
<word-count count="7439"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Sustainable and Intelligent Phytoprotection</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>The forest is the most important terrestrial ecosystem on Earth, playing a critical role in the global carbon cycle and terrestrial biosphere (<xref ref-type="bibr" rid="B12">He et&#xa0;al., 2007</xref>). The aboveground biomass (AGB) of forest is an important parameter that characterizes their carbon sequestration capacity. Because forest biomass affects a range of ecosystem processes, such as carbon and water cycles, energy fluxes, and thus local and regional climate, the development of sustainable forest management strategies requires accurate information on forest AGB (<xref ref-type="bibr" rid="B42">Urbazaev et&#xa0;al., 2018</xref>). Quantitative estimates of aboveground forest biomass provide basic data to support the carbon cycle of the global forest biomass system, thus contributing to the development of global carbon reduction policies and climate change mitigation and providing the necessary information for the development of sustainable forest management (<xref ref-type="bibr" rid="B7">Dixon et&#xa0;al., 1994</xref>; <xref ref-type="bibr" rid="B4">Cao et&#xa0;al., 2014</xref>). Forest AGB is all aboveground living material, and it includes partitioned biomass components like stem, bark, leaves, and branches (<xref ref-type="bibr" rid="B49">Zhang et&#xa0;al., 2011</xref>). Biomass components provide important information for forest management decisions. For example, knowledge of crown biomass aids fuel load assessment and strategies of fire management. Although knowledge of the contribution of each component to AGB is crucial for studying forest growth, it is essential to understand how these components interact with each other (<xref ref-type="bibr" rid="B23">Lambert et&#xa0;al., 2005</xref>; <xref ref-type="bibr" rid="B35">Saatchi et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B13">He et&#xa0;al., 2013</xref>). Meanwhile, the saturation problems resulted from the low penetration of short electromagnetic wave in the forest with high AGB level are the bottleneck problems in forest AGB inversion using remote sensing technology, and accurate estimation of biomass components can improve the estimation saturation points in AGB estimation and reduce the uncertainty of carbon sink estimation, which is the key to quantify carbon stock and plays an important role in modern forest and ecosystem management (<xref ref-type="bibr" rid="B18">Jia et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B32">Nie et&#xa0;al., 2017</xref>). Therefore, accurate forest total AGB and forest AGB components are crucial. However, accurate estimation of forest total AGB and biomass components is still a challenging task in forestry research at present.</p>
<p>Light Detection and Ranging (LiDAR) is a powerful tool for estimating AGB in forests with fine resolution, which provides detailed three-dimensional information about the forest structure by emitting LiDAR pulses that penetrate the canopy. This is closely related to the spatial heterogeneity of forest carbon content and habitat (<xref ref-type="bibr" rid="B1">Asner et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B43">Vaglio Laurin et&#xa0;al., 2016</xref>). Total and component AGB were investigated and estimated using LiDAR-derived features in previous research (<xref ref-type="bibr" rid="B31">N&#xe6;sset and Gobakken, 2008</xref>; <xref ref-type="bibr" rid="B41">Tsui et&#xa0;al., 2012</xref>; <xref ref-type="bibr" rid="B13">He et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B4">Cao et&#xa0;al., 2014</xref>). A large number of LiDAR-derived features were demonstrated to be useful of predicting biomass; however, they also revealed that the results were site or species dependent (<xref ref-type="bibr" rid="B50">Zhao et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B36">Salas et&#xa0;al., 2010</xref>). In parametric regression algorithms, the population assumptions of regression models are usually based on linear relationships. However, it is difficult to fully describe the complex non-linear relationship between forest AGB and LiDAR data using traditional statistical regression methods (<xref ref-type="bibr" rid="B51">Zhao et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B40">Torre-Tojal et&#xa0;al., 2022</xref>). Several studies found that machine learning algorithms, such as random forest (RF) and support vector regression (SVR) that abandoned the population assumptions that did not represent the heterogeneity of forest stands in parametric regression algorithms, performed better than parametric algorithms in forest AGB estimation (<xref ref-type="bibr" rid="B2">Breidenbach et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B44">Vauhkonen et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B10">Gleason and Im, 2012</xref>; <xref ref-type="bibr" rid="B11">G&#xf6;rgens et&#xa0;al., 2015</xref>). Therefore, many studies have applied machine learning algorithms for forest AGB estimation. The performance of machine learning algorithms applied in forest AGB estimation using LiDAR-derived features was not fully explored by far, and their capability for accurate AGB estimation has no agreement (<xref ref-type="bibr" rid="B10">Gleason and Im, 2012</xref>). Although the machine learning algorithms show a good performance, the large amount of data constrains the direct use features extracted from LiDAR data as input to the inversion models. For forest AGB estimation using remote sensing observations, a key step is to optimize the optimal features from abundant remote sensing observation (<xref ref-type="bibr" rid="B47">Yang et&#xa0;al., 2017</xref>). The importance of each extracted feature was interpreted and ranked by G&#xf6;rgens et&#xa0;al. (<xref ref-type="bibr" rid="B11">G&#xf6;rgens et&#xa0;al., 2015</xref>); however, the optimization of feature was not fully explored yet; especially, little was known about component AGB estimation.</p>
<p>For machine learning models to estimate forest AGB, the method of testing model performance is important and involves appropriate validation methods to determine the best predictive model. Leave-one-out cross-validation (LOOCV) and cross-validation are popular for validating the results of forest biophysical parameter estimation. However, how effectively can these two validation methods be used and how different are they and what impact do they have on the estimation results? In our knowledge, it is not addressed yet. According to abovementioned research gap, this study focuses on forest total and component AGB retrieval using height-related features extracted from LiDAR by RF and SVR algorithms. Partial least squares regression (PLSR) algorithm combining the advantages of both principal component analysis (PCA) and multiple linear regression (MLR) was used for ranking and selecting the optimal LiDAR features. LOOCV and cross-validation methods were utilized and compared for results validation. By comparing the two validation methods, we aim to improve the reliability of the model assessment, find the most suitable validation strategy for the inversion model and data in the study area, and improve the efficiency of the utilization of computational resources with the expectation that the model performs well in a variety of data scenarios. The objective is to address the effects of the validation methods and also explore the potential of RF and SVR for forest AGB and component biomass inversion and the potential of PLSR algorithm for selecting the optimal LiDAR-extracted features. To be more concise, we use forest total biomass to describe the forest AGB; biomass components to describe the stem, bark, leave, and branch component biomass; and forest AGBs to describe both total and component biomass. It is expected to provide a valuable reference for the selection of the validation methods in machine learning inverse forest biomass and component biomass studies.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Study area</title>
<p>The Daxinganling National Forest Ecosystem Locating Station is the study area, and it is located in Genhe City, Hulunbuir, Inner Mongolia (50&#xb0;20&#x2032;N&#x2013;52&#xb0;30&#x2032;N; 120&#xb0;12&#x2032;E&#x2013;122&#xb0;55&#x2032;E; <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>), which is the highest latitude forest ecosystem field scientific observation station in China. Genhe is one of the cities with the highest latitude in China and the lowest average temperature in Inner Mongolia Autonomous Region, with an annual average temperature of &#x2212;11&#xb0;C~5&#xb0;C. The terrain in the study area is comparatively flat, over 80% of the study area with slopes less than 15&#xb0;. The average elevation is 1,000 m, and the elevation ranges from 700&#xa0;m to 1300&#xa0;m. The climate here is a cold-temperate humid forest climate and has some characteristics of continental monsoon climate, a typical area of high latitude permafrost and cold-temperate forest ecosystems. It is cold and wet, with long winters and short summers. The forest cover of the study area is more than 75%, and the main forest type is cold-temperate coniferous forest with complex forest vertical structure. The dominant tree species included in the field-sampled plots are <italic>Larix gmelinii</italic> and <italic>Betula platyphylla</italic>. These tree species covered around 95% of the forest type in the study area. The detailed information regarding tree species coverage is shown in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;1</bold>
</xref>.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Location and sample plot distribution of study area.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258521-g001.tif"/>
</fig>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Remote sensing data collection and pre-processing</title>
<sec id="s2_2_1">
<label>2.2.1</label>
<title>Collection of LiDAR data</title>
<p>In this study, aerial LiDAR data were acquired and utilized to extract features for forest AGB inversion. The LiDAR data were collected during August to September 2012, using the &#x201c;Yun-5&#x201d; manned aircraft equipped with a RIEGL LMS-Q680i laser sensor. During this campaign, the average flying altitude of the airborne platform was 2,700 m, with an average flying speed of 220 km/h, and 32 parallel flight tracks were acquired. The laser pulse frequency was 100&#x2013;200 kHz with a scan angle of &#xb1;35&#xb0; perpendicular to the flight direction. The average point cloud density was 5.6 points/m&#xb2;, and the scan overlap rate was about 80%. The acquired area in this campaign were 213 km&#xb2;. The data format was LAS1.4, and the sensor recorded the three-dimensional coordinate information (x, y, z) of each laser return point, as well as information such as the number of point clouds, intensity, and return type. The detail information of performance of RIEGL LMS-Q680i laser sensor are shown in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>. The maximum pulse repetition rate was 200 kHz, the maximum scanning frequency was 100&#xa0;Hz, the wavelength of the pulsed laser was 1,064 nm, and the relative flying height ranged from 200 to 5,000 m. The maximum scanning angle was 75&#xb0; (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>).</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>The performance of the RIEGL LMS-Q680i laser sensor for LiDAR data collection.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Index</th>
<th valign="middle" align="center">Value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">Maximum pulse repetition rate/kHZ</td>
<td valign="middle" align="center">200</td>
</tr>
<tr>
<td valign="middle" align="center">Maximum scanning frequency/Hz</td>
<td valign="middle" align="center">100</td>
</tr>
<tr>
<td valign="middle" align="center">pulse laser wavelength/nm</td>
<td valign="middle" align="center">1,064</td>
</tr>
<tr>
<td valign="middle" align="center">Relative flight height/m</td>
<td valign="middle" align="center">200&#x2013;5,000</td>
</tr>
<tr>
<td valign="middle" align="center">Maximum scanning angle/(&#xb0;)</td>
<td valign="middle" align="center">75</td>
</tr>
<tr>
<td valign="middle" align="center">Point density/(number m<sup>&#x2212;2</sup>)</td>
<td valign="middle" align="center">&gt;4</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2_2_2">
<label>2.2.2</label>
<title>Preprocessing of LiDAR data</title>
<p>The raw LiDAR data were processed by the research group of Chinese Academy of Forestry (CAF) through three main steps, namely, full waveform decomposition, geocoding, and boresight calibration (<xref ref-type="bibr" rid="B33">Pang et&#xa0;al., 2016</xref>). The preprocessing steps for the LiDAR data in this research include point cloud denoising, point cloud filtering, point cloud classification, and normalization of LiDAR point cloud data. Here, the normalization removes the influence of terrain undulations on the elevation values of the point cloud data, requiring that the range of the DEM has an intersection area with the range of the point cloud data, and the process is to subtract the corresponding DEM elevation value found from the elevation value Z for each point. LiDAR360 software was used for the left preprocessing of LiDAR data, and, then, the preprocessed LiDAR data were used to extract features for forest AGB estimation (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>). The results of the pre-processed LiDAR point cloud data were shown as <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Point cloud data preprocessed results. <bold>(A)</bold> Raw point cloud data of the study area. <bold>(B)</bold> Point cloud data before normalization. <bold>(C)</bold> Point cloud data after normalization.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258521-g002.tif"/>
</fig>
</sec>
<sec id="s2_2_3">
<label>2.2.3</label>
<title>LiDAR feature extraction</title>
<p>After data preprocessing, a total of 56 LiDAR feature parameters were extracted (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>). The extraction of these parameters was based on previous research findings (<xref ref-type="bibr" rid="B29">Liu et al., 2018</xref>; <xref ref-type="bibr" rid="B30">Micha&#x142;owska and Rapi&#x144;, 2021</xref>; <xref ref-type="bibr" rid="B52">Zhou et al., 2022</xref>). To determine the density of point cloud data based on height, the data were split into 10 equally sized height layers for points above 2&#xa0;m. Within each layer, the ratio of the number of points to the total number of points was calculated, resulting in a density feature parameter. This method offers a way to analyze point density at different heights, which can help reveal patterns and features of the object being scanned.</p>
</sec>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Field campaign and processing of the collected plot measurements</title>
<sec id="s2_3_1">
<label>2.3.1</label>
<title>Collection of plot data</title>
<p>The ground plot data used in this study were collected through field surveys conducted in the Genhe during August in 2012 and 2013 and used for training and validation of the forest AGB inversion models. The collected plots included 25 fixed plots of 40&#xa0;m &#xd7; 40&#xa0;m surveyed in 2012 and 18 plots of 45&#xa0;m &#xd7; 45&#xa0;m investigated in 2013. Differential Global Positioning System (GPS) was used to locate the four corner coordinates of each plot, and the errors of plot boundary and position were controlled within 1&#xa0;m. In each sample plot, diameter at breast height (DBH), tree height (H), and tree species were recorded for trees with DBH &#x2265; 5&#xa0;cm.</p>
</sec>
<sec id="s2_3_2">
<label>2.3.2</label>
<title>Aboveground biomass calculation</title>
<p>Forest total biomass and component biomass of each tree were calculated by allometric equations and component equations published by the State Forestry Administration of China (<xref ref-type="bibr" rid="B38">State Forestry Administration of China, 2016a</xref>; <xref ref-type="bibr" rid="B39">State Forestry Administration of China, 2016b</xref>). Then, the total AGB and component AGBs of each plot were calculated by the sum of each tree in the plot with normalization by area of each sample plot (<xref ref-type="bibr" rid="B26">Li et&#xa0;al., 2015</xref>).</p>
<p>In this study, two tree species, namely, <italic>Larix gmelinii</italic> and <italic>Betula platyphylla</italic>, were involved, and the corresponding equations for AGB calculation are shown in <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>. <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref> and <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref> show the statistics of calculated forest total and component AGBs.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Equations for calculating total and component AGBs.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">AGB</th>
<th valign="middle" align="center">Equations</th>
<th valign="middle" align="center">
<italic>R</italic>
<sup>2</sup>
</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">Total AGB (<inline-formula>
<mml:math display="inline" id="im18">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>A</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>)</td>
<td valign="middle" align="left">
<inline-formula>
<mml:math display="inline" id="im19">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>060848</mml:mn>
<mml:msup>
<mml:mi>D</mml:mi>
<mml:mrow>
<mml:mn>2.01549</mml:mn>
</mml:mrow>
</mml:msup>
<mml:msup>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mn>0.59146</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>D</mml:mi>
<mml:mi>B</mml:mi>
<mml:mi>H</mml:mi>
<mml:mo>&#x2265;</mml:mo>
<mml:mn>5.0</mml:mn>
<mml:mi>c</mml:mi>
<mml:mi>m</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
<inline-formula>
<mml:math display="inline" id="im20">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>0.06807</mml:mn>
<mml:msup>
<mml:mi>D</mml:mi>
<mml:mrow>
<mml:mn>0.10850</mml:mn>
</mml:mrow>
</mml:msup>
<mml:msup>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mn>0.52019</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>D</mml:mi>
<mml:mi>B</mml:mi>
<mml:mi>H</mml:mi>
<mml:mo>&#x2265;</mml:mo>
<mml:mn>5.0</mml:mn>
<mml:mi>c</mml:mi>
<mml:mi>m</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td valign="middle" align="center">
<italic>Larix gmelinii</italic>: 0.9690<break/>
<italic>Betula platyphylla</italic>: 0.9550</td>
</tr>
<tr>
<td valign="middle" align="center">Stem biomass (<inline-formula>
<mml:math display="inline" id="im21">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>)</td>
<td valign="middle" align="center">
<inline-formula>
<mml:math display="inline" id="im22">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#xd7;</mml:mo>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>A</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td valign="middle" align="center">
<italic>Larix gmelinii</italic>: 0.9701<break/>
<italic>Betula platyphylla</italic>: 0.9545</td>
</tr>
<tr>
<td valign="middle" align="center">Bark biomass (<inline-formula>
<mml:math display="inline" id="im23">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>)</td>
<td valign="middle" align="center">
<inline-formula>
<mml:math display="inline" id="im24">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#xd7;</mml:mo>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>A</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td valign="middle" align="center">
<italic>Larix gmelinii</italic>: 0.8817<break/>
<italic>Betula platyphylla</italic>: 0.8678</td>
</tr>
<tr>
<td valign="middle" align="center">Branch biomass (<inline-formula>
<mml:math display="inline" id="im25">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>h</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>)</td>
<td valign="middle" align="center">
<inline-formula>
<mml:math display="inline" id="im26">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#xd7;</mml:mo>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>A</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td valign="middle" align="center">
<italic>Larix gmelinii</italic>: 0.8513<break/>
<italic>Betula platyphylla</italic>: 0.9545</td>
</tr>
<tr>
<td valign="middle" align="center">Leaf biomass (<inline-formula>
<mml:math display="inline" id="im27">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>f</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>)</td>
<td valign="middle" align="center">
<inline-formula>
<mml:math display="inline" id="im28">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>f</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#xd7;</mml:mo>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>A</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td valign="middle" align="center">
<italic>Larix gmelinii</italic>: 0.7439<break/>
<italic>Betula platyphylla</italic>: 0.6311</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>
<inline-formula>
<mml:math display="inline" id="im29">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>h</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the AGB of a Larch (kg); <inline-formula>
<mml:math display="inline" id="im30">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>h</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the AGB of a Birch (kg); <inline-formula>
<mml:math display="inline" id="im31">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mi>A</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the estimated AGB of tree species (kg); <inline-formula>
<mml:math display="inline" id="im32">
<mml:mi>H</mml:mi>
</mml:math>
</inline-formula> is the height of the tree (m); <inline-formula>
<mml:math display="inline" id="im33">
<mml:mi>D</mml:mi>
</mml:math>
</inline-formula> is the diameter of a tree measured at breast height (cm); <inline-formula>
<mml:math display="inline" id="im34">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula>
<mml:math display="inline" id="im35">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula>
<mml:math display="inline" id="im36">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>h</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula>
<mml:math display="inline" id="im37">
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>f</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are the AGB of stem, bark, branches, and leaves of each tree, respectively; <inline-formula>
<mml:math display="inline" id="im38">
<mml:mrow>
<mml:msub>
<mml:mi>g</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula>
<mml:math display="inline" id="im39">
<mml:mrow>
<mml:msub>
<mml:mi>g</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula>
<mml:math display="inline" id="im40">
<mml:mrow>
<mml:msub>
<mml:mi>g</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are the proportional functions of bark, branches, and leaves, respectively, relative to stem biomass of 1.</p>
</fn>
<fn>
<p>Larix gmelinii: <inline-formula>
<mml:math display="inline" id="im41">
<mml:mrow>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>0.36742</mml:mn>
<mml:mi>D</mml:mi>
<mml:mi>B</mml:mi>
<mml:msup>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>0.16892</mml:mn>
</mml:mrow>
</mml:msup>
<mml:msup>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>0.17313</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula>
<mml:math display="inline" id="im42">
<mml:mrow>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>2.30634</mml:mn>
<mml:mi>D</mml:mi>
<mml:mi>B</mml:mi>
<mml:msup>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mn>0.72188</mml:mn>
</mml:mrow>
</mml:msup>
<mml:msup>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.45081</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula>
<mml:math display="inline" id="im43">
<mml:mrow>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>1.57804</mml:mn>
<mml:mi>D</mml:mi>
<mml:mi>B</mml:mi>
<mml:msup>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mn>0.19527</mml:mn>
</mml:mrow>
</mml:msup>
<mml:msup>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.36274</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
</fn>
<fn>
<p>
<italic>Betula platyphylla</italic>: <inline-formula>
<mml:math display="inline" id="im44">
<mml:mrow>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>0.53498</mml:mn>
<mml:mi>D</mml:mi>
<mml:mi>B</mml:mi>
<mml:msup>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mn>0.09004</mml:mn>
</mml:mrow>
</mml:msup>
<mml:msup>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>0.46520</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula>
<mml:math display="inline" id="im45">
<mml:mrow>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>1.05167</mml:mn>
<mml:mi>D</mml:mi>
<mml:mi>B</mml:mi>
<mml:msup>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mn>0.66925</mml:mn>
</mml:mrow>
</mml:msup>
<mml:msup>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.04662</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula>
<mml:math display="inline" id="im46">
<mml:mrow>
<mml:msub>
<mml:mi>&#x261;</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>0.61793</mml:mn>
<mml:mi>D</mml:mi>
<mml:mi>B</mml:mi>
<mml:msup>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mn>0.17097</mml:mn>
</mml:mrow>
</mml:msup>
<mml:msup>
<mml:mi>H</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>0.88182</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>
</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>The distribution of total and component AGB for each plot.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258521-g003.tif"/>
</fig>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Statistics of calculated total and component AGBs.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Type</th>
<th valign="middle" align="center">Mean/(t ha<sup>&#x2212;1</sup>)</th>
<th valign="middle" align="center">Maximum/(t ha<sup>&#x2212;1</sup>)</th>
<th valign="middle" align="center">Minimum/(t ha<sup>&#x2212;1</sup>)</th>
<th valign="middle" align="center">Standard deviation/(t ha<sup>&#x2212;1</sup>)</th>
<th valign="middle" align="center">Standard error/(t ha<sup>&#x2212;1</sup>)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">Total AGB</td>
<td valign="middle" align="center">92.80</td>
<td valign="middle" align="center">203.53</td>
<td valign="middle" align="center">20.40</td>
<td valign="middle" align="center">46.32</td>
<td valign="middle" align="center">7.06</td>
</tr>
<tr>
<td valign="middle" align="center">Stem biomass</td>
<td valign="middle" align="center">61.14</td>
<td valign="middle" align="center">142.80</td>
<td valign="middle" align="center">10.41</td>
<td valign="middle" align="center">32.66</td>
<td valign="middle" align="center">4.98</td>
</tr>
<tr>
<td valign="middle" align="center">Branch biomass</td>
<td valign="middle" align="center">18.12</td>
<td valign="middle" align="center">35.72</td>
<td valign="middle" align="center">5.77</td>
<td valign="middle" align="center">8.51</td>
<td valign="middle" align="center">1.30</td>
</tr>
<tr>
<td valign="middle" align="center">Bark biomass</td>
<td valign="middle" align="center">9.15</td>
<td valign="middle" align="center">17.77</td>
<td valign="middle" align="center">2.37</td>
<td valign="middle" align="center">4.27</td>
<td valign="middle" align="center">0.65</td>
</tr>
<tr>
<td valign="middle" align="center">Leaf biomass</td>
<td valign="middle" align="center">4.39</td>
<td valign="middle" align="center">8.30</td>
<td valign="middle" align="center">1.26</td>
<td valign="middle" align="center">1.63</td>
<td valign="middle" align="center">0.25</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Methodology</title>
<p>
<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref> illustrates the framework of this study; first, LiDAR-derived features were extracted as independent variables, and the total and component AGB of each plot were calculated worked as dependent variables; second, PLSR algorithm was used for optimal independent variables selection; third, SVR and RF algorithms were trained for estimating forest total and component AGB; finally, validation and comparative analysis were performed (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>).</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Strategy of identifying suitable LiDAR-derived features (PLSR) and suitable forest total and component AGBs modeling approach (RF and SVR).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258521-g004.tif"/>
</fig>
<sec id="s2_4_1">
<label>2.4.1</label>
<title>LiDAR-derived feature selection using partial least squares regression</title>
<p>PLSR was a multivariate statistical analysis algorithm. It could achieve quantitative analysis in the case of multiple correlation of independent variables and could easily exclude the noise in the independent variables. It combined the advantages of PCA and MLR and had outstanding advantages in solving the problems that were difficult to analyze in MLR and in dealing with the problem of multiple cointegration among independent variables. PLSR algorithm optimizes linear regression models to project the input LiDAR-derived features and output AGB into new orthogonal spaces with better predictive capabilities, and it was effective for large number of explanatory LiDAR-derived features that were often not independent of each other. For the procedure of selecting the variables, in this study, by maximizing the covariance between projected LiDAR-derived features and the total forest biomass or component biomass, the orthogonal loading matrix could be solved, and, then, the number of explanatory features for AGB or component biomass was significantly reduced. During the procedure, VIP [variable importance in projection; Equation (1)] values were calculated to optimize the LiDAR-derived measurements. The higher the VIP value, the more significant the independent variable was to the dependent variable; if all independent factors had identical explanatory power over dependent variable, then all VIP values were 1.</p>
<disp-formula>
<label>(1)</label>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:mi>V</mml:mi>
<mml:mi>I</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>=</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:mfrac>
<mml:mi>k</mml:mi>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>h</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:msup>
<mml:mi>r</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>y</mml:mi>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mi>h</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mfrac>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>h</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:msup>
<mml:mi>r</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>y</mml:mi>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mi>h</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:msubsup>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mi>h</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im47">
<mml:mi>k</mml:mi>
</mml:math>
</inline-formula> is the number of independent variables, <inline-formula>
<mml:math display="inline" id="im48">
<mml:mrow>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mi>h</mml:mi>
</mml:msub>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> is the principal component extracted from the independent variable of interest, <inline-formula>
<mml:math display="inline" id="im49">
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>y</mml:mi>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>c</mml:mi>
<mml:mi>h</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is the correlation coefficient between the dependent variable and the principal component, denoting the explanatory power of the principal component for <inline-formula>
<mml:math display="inline" id="im50">
<mml:mi>y</mml:mi>
</mml:math>
</inline-formula>, and <inline-formula>
<mml:math display="inline" id="im51">
<mml:mrow>
<mml:msub>
<mml:mi>w</mml:mi>
<mml:mrow>
<mml:mi>h</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the weight of the independent variable on the principal component.</p>
</sec>
<sec id="s2_4_2">
<label>2.4.2</label>
<title>Machine learning approaches for forest AGB inversion</title>
<p>RF and SVR were selected and employed to predict forest total AGB and component AGB in this study. RF was based on decision trees, and the original training samples were randomly sampled with put-back by bootstrap algorithm, and the samples that are not included in the decision trees were used as test samples. For the regression problem, the predicted values of each decision tree in the RF were used to average the final predicted values (<xref ref-type="bibr" rid="B3">Breiman, 2001</xref>). In this study, we used the sklearn package of Python software to train and validate RF model for predicting forest total biomass and biomass components. The maximum feature variable (mtry) and the number of decision trees (ntree) were set as 100 and 15 during the model training procedure.</p>
<p>SVR seeks to obtain the best promotion ability based on a small number of samples by finding the optimal balance between the model&#x2019;s complexity and learning capacity (<xref ref-type="bibr" rid="B9">Drucker et&#xa0;al., 1997</xref>); SVR includes non-linear regression and linear regression algorithms; the basic idea of non-linear regression algorithm is to introduce a suitable kernel function in the sample dataset to map the data from low-dimensional space to high-dimensional space; then, the non-linear problem in low-dimensional space is converted into a linear problem in high-dimensional space. The linear regression is performed in this high-dimensional space, aiming to find the best fit line of the data, i.e., the hyperplane with the highest number of points that can accurately predict the data (<xref ref-type="bibr" rid="B6">Chen et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B46">Xue et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B45">Xiong and Li, 2019</xref>). In this study, the radial basis function was used as the kernel function, and the constant of the regularization term in the Lagrangian formula was equal to 1. SVR algorithms were implemented by sklearn package of Python software.</p>
</sec>
<sec id="s2_4_3">
<label>2.4.3</label>
<title>Validation algorithms</title>
<p>To validate the accuracy of inversion results, a LOOCV method and a cross-validation method were used. The basic idea of the LOOCV is to assume that there are N samples, from which N&#x2212;1 samples are selected for training, and the remaining samples are used for validation, and so on, until all samples are traversed, and the final result is the mean value of N validation errors. It is able to exclude the influence of random factors and ensures that the validation process is repeatable and has the advantage of almost unbiased generalization error estimates (<xref ref-type="bibr" rid="B28">Liu et&#xa0;al., 2011</xref>). When using the cross-validation method, RF and SVR build the model by randomly selecting 70% of the samples for model training and the remaining 30% for validation, and the procedure was performed 10 times and the average values were presented here.</p>
<p>Pearson&#x2019;s coefficient [<italic>R</italic>&#xb2;; Equation (2)] of determination, root mean square error [RMSE; Equation (3)], relative RMSE [rRMSE; Equation (4)], and mean absolute error [MAE; Equation (5)] were selected as indicators to predict the accuracy of the model.</p>
<disp-formula>
<label>(2)</label>
<mml:math display="block" id="M2">
<mml:mrow>
<mml:msup>
<mml:mi>R</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="true">^</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<label>(3)</label>
<mml:math display="block" id="M3">
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>=</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>m</mml:mi>
</mml:mfrac>
</mml:mrow>
</mml:msqrt>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>m</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="true">^</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<label>(4)</label>
<mml:math display="block" id="M4">
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
</mml:mrow>
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mfrac>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>100</mml:mn>
<mml:mo>%</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula>
<label>(5)</label>
<mml:math display="block" id="M5">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>m</mml:mi>
</mml:mfrac>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>m</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="true">^</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>|</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <inline-formula>
<mml:math display="inline" id="im52">
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>^</mml:mo>
</mml:mover>
</mml:math>
</inline-formula> is the predicted value of the model, <inline-formula>
<mml:math display="inline" id="im53">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the sample plot measurement, <inline-formula>
<mml:math display="inline" id="im54">
<mml:mover accent="true">
<mml:mi>y</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:math>
</inline-formula> is the mean value of the sample plot measurement, and <inline-formula>
<mml:math display="inline" id="im55">
<mml:mi>m</mml:mi>
</mml:math>
</inline-formula> is the number of training and validation sample plots.</p>
</sec>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Optimized LiDAR-derived features</title>
<p>To find the best variables to predict the total and component AGB of the forest, observations with VIP value greater than 1.0 were selected for further AGB inversion (<xref ref-type="bibr" rid="B20">Ju et&#xa0;al., 2022</xref>). Since PLSR combines the advantages of PCA and MLR, it is effective to extract the reduced by more useful LiDAR-derived features for forest AGBs estimation, especially since input features were not independent of each other. Like the characteristic of PCA, 56 observations and output forest total or each AGB component were projected into new orthogonal spaces, which have better predictive capabilities, and, then, VIP values are calculated and sorted according to the interpreted variance (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>). As shown in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>, the blue ones are selected features with VIP values greater than 1, and the gray ones are abandoned features. The 37 LiDAR-derived features were selected as features for leaf AGB estimation, and 32 features were selected for total AGB and biomass of other component estimation. Four cumulative height percentiles (<italic>AIH</italic>
<sub>30</sub>, <italic>AIH</italic>
<sub>40</sub>, <italic>AIH</italic>
<sub>20</sub>, and <italic>AIH</italic>
<sub>25</sub>) were selected as the top 10 variables for total AGB estimation, and two height percentiles (<italic>H</italic>
<sub>8</sub> and <italic>H</italic>
<sub>6</sub>) and four height-related variables (<italic>H</italic>
<sub>mean</sub>, <italic>H</italic>
<sub>sqrt</sub>, <italic>H</italic>
<sub>mad</sub>, and <italic>H</italic>
<sub>curt</sub>) were height-related variables.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>The VIP values of each LiDAR-derived feature graph (the blue ones are selected features with VIP values greater than 1, and the gray ones are abandoned features). From <bold>(A&#x2013;E)</bold>, the LiDAR characteristics of total biomass, stem, bark, branch and leaf were selected.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258521-g005.tif"/>
</fig>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Forest AGB inversion using RF and SVR</title>
<sec id="s3_2_1">
<label>3.2.1</label>
<title>Forest AGB estimation results using RF</title>
<p>The LiDAR features selected by PLSR were input in the RF regression model for forest total biomass and biomass component inversion, and the inversion accuracy of the models was tested using LOOCV and cross-validation. <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref> graphs the estimation results validated using LOOCV, and <xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref> summarizes the statistical information of the results from <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>, which are the scatter points for the built models and validations of the models.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Forest total and component AGB estimation results using LOOCV validation. The solid lines in the scatter plots are 1:1 verification lines: <bold>(A)</bold> for total AGB, <bold>(B)</bold> for stem; <bold>(C)</bold> for bark, <bold>(D)</bold> for branch, and <bold>(E)</bold> for leaf.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258521-g006.tif"/>
</fig>
<table-wrap id="T4" position="float">
<label>Table&#xa0;4</label>
<caption>
<p>The LOOCV was used to check the accuracy results of the model (RF).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Components</th>
<th valign="middle" align="center">
<italic>R</italic>
<sup>2</sup>
</th>
<th valign="middle" align="center">RMSE/(t&#x2022;ha<sup>&#x2212;1</sup>)</th>
<th valign="middle" align="center">rRMSE/(%)</th>
<th valign="middle" align="center">MAE/(t&#x2022;ha<sup>&#x2212;1</sup>)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">Stem biomass</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">18.14</td>
<td valign="middle" align="center">30.26</td>
<td valign="middle" align="center">14.49</td>
</tr>
<tr>
<td valign="middle" align="center">Bark biomass</td>
<td valign="middle" align="center">0.63</td>
<td valign="middle" align="center">2.58</td>
<td valign="middle" align="center">28.34</td>
<td valign="middle" align="center">2.21</td>
</tr>
<tr>
<td valign="middle" align="center">Branch biomass</td>
<td valign="middle" align="center">0.65</td>
<td valign="middle" align="center">4.99</td>
<td valign="middle" align="center">27.33</td>
<td valign="middle" align="center">0.65</td>
</tr>
<tr>
<td valign="middle" align="center">Leaf biomass</td>
<td valign="middle" align="center">0.54</td>
<td valign="middle" align="center">1.10</td>
<td valign="middle" align="center">25.01</td>
<td valign="middle" align="center">0.87</td>
</tr>
<tr>
<td valign="middle" align="center">Total AGB</td>
<td valign="middle" align="center">0.75</td>
<td valign="middle" align="center">22.93</td>
<td valign="middle" align="center">25.30</td>
<td valign="middle" align="center">19.26</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>As shown in <xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref>, when using the LOOCV validation method to estimated accuracy of the models, the RF model performed best for total AGB estimation (<italic>R</italic>
<sup>2</sup>&#xa0;=&#xa0;0.75, RMSE = 22.93 Mg/ha, rRMSE = 25.30%, and MAE = 19.26 Mg/ha). From the scatter plot of the model fit in <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>, the prediction results were positively and linearly correlated around the 1:1 line, and it shows some overestimation phenomena for low AGB values, but, with the increase of AGB values, the prediction trend become better with no saturation phenomenon for high AGB values. The accuracy for the stem biomass model (<italic>R</italic>
<sup>2</sup>&#xa0;=&#xa0;0.69, RMSE = 18.14 Mg/ha, rRMSE = 30.26%, and MAE = 14.49 Mg/ha) was slightly lower than that of the total AGB. The prediction trend in <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6B</bold>
</xref> is similar to that in <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6A</bold>
</xref> but with a slightly lower <italic>R</italic>
<sup>2</sup>. On the basis of the RMSE and MAE values, the error of the estimated component AGB is lower than the error of the total AGB. <xref ref-type="fig" rid="f6"><bold>Figures 6C&#x2013;E</bold></xref>, respectively represent the estimation results of forest biomass for stems, branches, and leaves using LOOCV validation.</p>
<p>
<xref ref-type="table" rid="T5">
<bold>Table&#xa0;5</bold>
</xref> and <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref> show the performance of the RF models with training and validation datasets. <xref ref-type="table" rid="T5">
<bold>Table&#xa0;5</bold>
</xref> summarizes the information with model accuracies and validation accuracies. For model training, the constructed RF models showed good estimation results with all <italic>R</italic>
<sup>2</sup> greater than 0.80 and rRMSEs ranging from 12.66% to 16.21%, whereas the accuracies decreased when the constructed models were validated using the left out 30% samples. <italic>R</italic>
<sup>2</sup> ranges from 0.49 to 0.65, and rRMSE ranges from 26.37% to 31.89%. According to <xref ref-type="table" rid="T5">
<bold>Table&#xa0;5</bold>
</xref> and <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref>, the RF model for leaf component AGB estimation performed with the lowest <italic>R</italic>
<sup>2</sup> value during its training procedure does not show the highest rRMSE value although it has the lowest <italic>R</italic>
<sup>2</sup> value of 0.86. The scatter plots of both the individual components and the total biomass exhibit overestimation and underestimation phenomena. The results may result from the narrow dynamic range of leaf biomass. Meanwhile, the RF model for stem AGB estimation showed better performance even if its highest rRMSE of 16.21% during the model training procedure. However, the model constructed for total AGB estimations acquired highest <italic>R</italic>
<sup>2</sup> of 0.93 and lowest rRMSE of 12.66% during model training also performed best for validation procedure with highest <italic>R</italic>
<sup>2</sup> of 0.67 and lowest rRMSE of 25.67%.</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Cross-validation method to test the accuracy of RF models. The solid line is 1:1 verification line. In the figure, the first row shows the performance of the model on the training set. The second row shows the performance of the model on the test set.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258521-g007.tif"/>
</fig>
<table-wrap id="T5" position="float">
<label>Table&#xa0;5</label>
<caption>
<p>The cross-validation method was used to check the accuracy results of the model (RF).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" rowspan="2" align="center">Components</th>
<th valign="middle" colspan="3" align="center">Training set</th>
<th valign="middle" colspan="3" align="center">Test set</th>
</tr>
<tr>
<th valign="middle" align="center">
<italic>R</italic>
<sup>2</sup>
</th>
<th valign="middle" align="center">RMSE/(t&#x2022;ha<sup>&#x2212;1</sup>)</th>
<th valign="middle" align="center">rRMSE/(%)</th>
<th valign="middle" align="center">
<italic>R</italic>
<sup>2</sup>
</th>
<th valign="middle" align="center">RMSE/(t&#x2022;ha <sup>1</sup>)</th>
<th valign="middle" align="center">rRMSE/(%)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">Stem biomass</td>
<td valign="middle" align="center">0.91</td>
<td valign="middle" align="center">9.92</td>
<td valign="middle" align="center">16.21</td>
<td valign="middle" align="center">0.60</td>
<td valign="middle" align="center">19.15</td>
<td valign="middle" align="center">31.89</td>
</tr>
<tr>
<td valign="middle" align="center">Bark biomass</td>
<td valign="middle" align="center">0.90</td>
<td valign="middle" align="center">1.37</td>
<td valign="middle" align="center">14.97</td>
<td valign="middle" align="center">0.57</td>
<td valign="middle" align="center">2.51</td>
<td valign="middle" align="center">29.34</td>
</tr>
<tr>
<td valign="middle" align="center">Branch biomass</td>
<td valign="middle" align="center">0.89</td>
<td valign="middle" align="center">2.70</td>
<td valign="middle" align="center">14.84</td>
<td valign="middle" align="center">0.65</td>
<td valign="middle" align="center">4.89</td>
<td valign="middle" align="center">28.32</td>
</tr>
<tr>
<td valign="middle" align="center">Leaf biomass</td>
<td valign="middle" align="center">0.86</td>
<td valign="middle" align="center">0.58</td>
<td valign="middle" align="center">13.09</td>
<td valign="middle" align="center">0.49</td>
<td valign="middle" align="center">0.99</td>
<td valign="middle" align="center">26.37</td>
</tr>
<tr>
<td valign="middle" align="center">Forest total biomass</td>
<td valign="middle" align="center">0.93</td>
<td valign="middle" align="center">11.89</td>
<td valign="middle" align="center">12.66</td>
<td valign="middle" align="center">0.67</td>
<td valign="middle" align="center">24.56</td>
<td valign="middle" align="center">25.67</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The results of both validation methods indicated that the LiDAR characteristic variables were strongly correlated with the total and component AGBs and that the RF model performed good for forest AGBs estimation.</p>
<p>
<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8</bold>
</xref> shows the comparison between the total and biomass components of the sample plots calculated by the stumpage biomass model and the model predictions. The ratios of stem, branch, bark, and leaf in the total biomass from the field collected datasets were 65.98%, 19.35%, 9.92%, and 4.75%, respectively. For the estimated total and component AGBs in the test site, leaf AGB accounts for the lowest ratio with 4.81% and branch and stem accounts for 85.24% of the total AGB. The distribution of each component to the total AGB from the predicted results have similar distribution pattern with the true values.</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>Comparison of total and biomass components of sample plots calculated by the standing wood biomass model with the predicted values from the RF model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258521-g008.tif"/>
</fig>
</sec>
<sec id="s3_2_2">
<label>3.2.2</label>
<title>Forest AGB estimation results using SVR</title>
<p>The LOOCV and cross-validation methods were also applied for the validation of estimated AGBs by SVR (<xref ref-type="table" rid="T6">
<bold>Table&#xa0;6</bold>
</xref>, <xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9</bold>
</xref>). Compared with the performance of RF, the overall prediction accuracies of SVR were lower. As shown in <xref ref-type="table" rid="T6">
<bold>Table&#xa0;6</bold>
</xref>, the SVR model performed best for total AGB estimation (<italic>R</italic>
<sup>2</sup>&#xa0;=&#xa0;0.66, RMSE = 26.75 Mg/ha, rRMSE = 28.62%, and MAE = 22.00 Mg/ha). From the scatter plot of the model fit in <xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9</bold>
</xref>, the prediction results were positively and linearly correlated around the 1:1 line. Underestimation occurs when AGB values are greater than 150 Mg/ha. Similar as the performance of RF, the <italic>R</italic>
<sup>2</sup> value for the stem biomass model was slightly lower than that of the total AGB. The scatter plot for stem shows similar trend with total AGB. The lowest <italic>R</italic>
<sup>2</sup> value was acquired for leaf AGB estimation. The rRMSE values for component AGB estimation range from 27.36% to 32.48%. For total and component forest total biomass estimation, the rRMSE values acquired by SAR were higher than that for the RF algorithms.</p>
<table-wrap id="T6" position="float">
<label>Table&#xa0;6</label>
<caption>
<p>The leave-one-out verification statistics for the support vector regression model.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Components</th>
<th valign="middle" align="center">
<italic>R</italic>
<sup>2</sup>
</th>
<th valign="middle" align="center">RMSE/(t&#x2022;ha<sup>&#x2212;1</sup>)</th>
<th valign="middle" align="center">rRMSE/(%)</th>
<th valign="middle" align="center">MAE/(Mg/ha)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">Stem biomass</td>
<td valign="middle" align="center">0.64</td>
<td valign="middle" align="center">19.52</td>
<td valign="middle" align="center">32.48</td>
<td valign="middle" align="center">16.02</td>
</tr>
<tr>
<td valign="middle" align="center">Bark biomass</td>
<td valign="middle" align="center">0.62</td>
<td valign="middle" align="center">2.61</td>
<td valign="middle" align="center">28.73</td>
<td valign="middle" align="center">2.07</td>
</tr>
<tr>
<td valign="middle" align="center">Branch biomass</td>
<td valign="middle" align="center">0.61</td>
<td valign="middle" align="center">5.30</td>
<td valign="middle" align="center">28.99</td>
<td valign="middle" align="center">4.34</td>
</tr>
<tr>
<td valign="middle" align="center">Leaf biomass</td>
<td valign="middle" align="center">0.45</td>
<td valign="middle" align="center">1.20</td>
<td valign="middle" align="center">27.36</td>
<td valign="middle" align="center">0.94</td>
</tr>
<tr>
<td valign="middle" align="center">Forest total biomass</td>
<td valign="middle" align="center">0.66</td>
<td valign="middle" align="center">26.75</td>
<td valign="middle" align="center">28.62</td>
<td valign="middle" align="center">22.00</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>Leave-one-out validation method to test the accuracy of the support vector regression model. The solid line is 1:1 verification line: <bold>(A)</bold> for total AGB, <bold>(B)</bold> for stem, <bold>(C)</bold> for bark, <bold>(D)</bold> for branch, and <bold>(E)</bold> for leaf.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258521-g009.tif"/>
</fig>
<p>For the experiments of cross-validation, 70% of the samples are randomly selected for model training and left 30% are used for validation; the procedures were performed 10 times, and the averaged values were calculated and summarized in <xref ref-type="table" rid="T7">
<bold>Table&#xa0;7</bold>
</xref>. The best performance with the highest <italic>R</italic>
<sup>2</sup> value was selected among these ten instances and graphed in <xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10</bold>
</xref>. According to the results from cross-validation, the performance of SVR algorithms shows worse performance than RF algorithms. For the model training, <italic>R</italic>
<sup>2</sup> values range from 0.70 to 0.74, and rRMSE values range from 20.82% to 27.29%. The <italic>R</italic>
<sup>2</sup> value decreased, whereas the RMSE and rRMSE values increased during testing, with <italic>R</italic>
<sup>2</sup> ranging from 0.50 to 0.65 and rRMSE ranging from 22.29% to 33.08%. When predicting biomass with the SVR model, the accuracy of validation with LOOCV was 0%&#x2013;5% higher than that of validation with the cross-validation method. The scatter plots of total and component AGB estimations show no obvious saturation phenomena. The results in <xref ref-type="table" rid="T7">
<bold>Table&#xa0;7</bold>
</xref> revealed that the lower rRMSE values in the model training procedure, the lower rRMSE values in the test procedure.</p>
<table-wrap id="T7" position="float">
<label>Table&#xa0;7</label>
<caption>
<p>The cross-validation method was used to check the accuracy results of the model.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" rowspan="2" align="center">Components</th>
<th valign="middle" colspan="3" align="center">Training set</th>
<th valign="middle" colspan="3" align="center">Test set</th>
</tr>
<tr>
<th valign="middle" align="center">
<italic>R</italic>
<sup>2</sup>
</th>
<th valign="middle" align="center">RMSE/(t&#x2022;ha<sup>&#x2212;1</sup>)</th>
<th valign="middle" align="center">rRMSE/(%)</th>
<th valign="middle" align="center">
<italic>R</italic>
<sup>2</sup>
</th>
<th valign="middle" align="center">RMSE/(t&#x2022;ha<sup>&#x2212;1</sup>)</th>
<th valign="middle" align="center">rRMSE/(%)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">Stem biomass</td>
<td valign="middle" align="center">0.74</td>
<td valign="middle" align="center">16.95</td>
<td valign="middle" align="center">27.29</td>
<td valign="middle" align="center">0.54</td>
<td valign="middle" align="center">19.26</td>
<td valign="middle" align="center">33.08</td>
</tr>
<tr>
<td valign="middle" align="center">Bark biomass</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">1.85</td>
<td valign="middle" align="center">23.40</td>
<td valign="middle" align="center">0.65</td>
<td valign="middle" align="center">2.48</td>
<td valign="middle" align="center">28.38</td>
</tr>
<tr>
<td valign="middle" align="center">Branch biomass</td>
<td valign="middle" align="center">0.71</td>
<td valign="middle" align="center">4.37</td>
<td valign="middle" align="center">24.21</td>
<td valign="middle" align="center">0.57</td>
<td valign="middle" align="center">5.87</td>
<td valign="middle" align="center">31.77</td>
</tr>
<tr>
<td valign="middle" align="center">Leaf biomass</td>
<td valign="middle" align="center">0.70</td>
<td valign="middle" align="center">0.91</td>
<td valign="middle" align="center">20.82</td>
<td valign="middle" align="center">0.50</td>
<td valign="middle" align="center">0.87</td>
<td valign="middle" align="center">22.29</td>
</tr>
<tr>
<td valign="middle" align="center">Forest AGB</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">22.06</td>
<td valign="middle" align="center">24.04</td>
<td valign="middle" align="center">0.56</td>
<td valign="middle" align="center">30.88</td>
<td valign="middle" align="center">31.41</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="f10" position="float">
<label>Figure&#xa0;10</label>
<caption>
<p>Cross-validation method to test the accuracy of support vector regression models. The solid line is 1:1 verification line. In the figure, the first row shows the performance of the model on the training set. The second row shows the performance of the model on the test set.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258521-g010.tif"/>
</fig>
<p>
<xref ref-type="fig" rid="f11">
<bold>Figure&#xa0;11</bold>
</xref> compares the RMSE and rRMSE values between RF and SVR algorithms using validation of LOOCV and cross-validation. For both RF and SVR, the RMSE values of the model training are lower than that of LOOCV and model testing in total and component AGB estimations. The RMSE values acquired by the LOOCV method for bark and leaf, which has lower AGB levels, showed a bit higher than that acquired at testing procedures of the cross-validation methods. For stem AGB estimation, RMSE values are almost same for LOOCV and cross-validation test procedure using both RF and SVR algorithms. The RMSE values acquired by LOOCV were lower than that acquired at testing procedure. It seemed that the rRMSE values acquired using the LOOCV method for both RF and SVR algorithms were lower or almost same as that acquired during testing procedures but greater than that acquired at model training procedures. Meanwhile, the rRMSE values for forest total biomass and biomass component estimation ranged from 25% to 32.5%. The acquired values using RF were lower than that using SVR algorithms.</p>
<fig id="f11" position="float">
<label>Figure&#xa0;11</label>
<caption>
<p>Comparison of the RF and SVR estimated results using LOOCV and cross-validation method. <bold>(A)</bold> The validation method for evaluating two models with RMSE. <bold>(B)</bold> The validation method for evaluating two models with rRMSE.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258521-g011.tif"/>
</fig>
</sec>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Forest AGB mapping</title>
<p>By comparing the accuracy of the two machine learning models using two validation methods, the RF model was chosen to perform forest total and component AGB inversion for the LiDAR data covering the study area. The spatial distribution maps of component AGBs are shown in <xref ref-type="fig" rid="f12">
<bold>Figure&#xa0;12</bold>
</xref>. The stem AGB (<xref ref-type="fig" rid="f12">
<bold>Figure&#xa0;12A</bold>
</xref>) ranged from 18.23 Mg/ha to 123.56 Mg/ha, bark AGB (<xref ref-type="fig" rid="f12">
<bold>Figure&#xa0;12B</bold>
</xref>) ranged from 2.96 Mg/ha to 16.04 Mg/ha, branch AGB (<xref ref-type="fig" rid="f12">
<bold>Figure&#xa0;12C</bold>
</xref>) ranged from 7.37 Mg/ha to 33.77 Mg/ha, and leaf biomass (<xref ref-type="fig" rid="f12">
<bold>Figure&#xa0;12D</bold>
</xref>) ranged from 1.92 Mg/ha to 6.66 Mg/ha.</p>
<fig id="f12" position="float">
<label>Figure&#xa0;12</label>
<caption>
<p>Spatial distribution of biomass component. <bold>(A)</bold> Stem, <bold>(B)</bold> bark, <bold>(C)</bold> branch, and <bold>(D)</bold> leaf.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258521-g012.tif"/>
</fig>
<p>
<xref ref-type="fig" rid="f13">
<bold>Figure&#xa0;13</bold>
</xref> displayed the spatial distribution map of estimated total AGB, which ranged from 35.02 Mg/ha to 180.11 Mg/ha. From <xref ref-type="fig" rid="f9">
<bold>Figures&#xa0;9</bold>
</xref> and <xref ref-type="fig" rid="f10">
<bold>10</bold>
</xref>, the retrieved AGBs seemed consistent with distribution trend of the LiDAR-derived AGB map.</p>
<fig id="f13" position="float">
<label>Figure&#xa0;13</label>
<caption>
<p>Spatial distribution of forest total biomass in the study area.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1258521-g013.tif"/>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>The feature parameters of machine learning models are not limited by dimensionality, and the inversion of forest total biomass using machine learning models has good robustness when there is multicollinearity between feature variables, effectively avoiding the loss of important parameters while maintaining excellent estimation performance (<xref ref-type="bibr" rid="B21">Kotsiantis et&#xa0;al., 2006</xref>; <xref ref-type="bibr" rid="B11">G&#xf6;rgens et&#xa0;al., 2015</xref>). Therefore, machine learning has been widely used for forest AGB estimation with good accuracy (<xref ref-type="bibr" rid="B5">Cao et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B19">Jiang et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B25">Li et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B40">Torre-Tojal et&#xa0;al., 2022</xref>). In the study by Ji et&#xa0;al. (<xref ref-type="bibr" rid="B17">Ji et&#xa0;al., 2022</xref>), the accuracy of parametric and non-parametric models for estimating the total forest AGB was compared using SAR data, and the results showed that the non-parametric model gave better estimates than the parametric model, and the non-parametric model was more advantageous than the parametric model in the estimation of the total forest AGB. In our study, two non-parametric models, namely, RF and SVR, were constructed using sample AGB and associated LiDAR remote sensing features for forest total AGB and component AGB inversion. The estimation accuracy of the inverse model was tested by the LOOCV and cross-validation methods.</p>
<p>The results of the comparison between the two machine learning models showed that the <italic>R</italic>
<sup>2</sup> value (0.75) of the total biomass estimated by RF was higher than that of SVR when using the LOOCV. This result is consistent with the findings of several studies. For example, the RF and SVR models were compared by G&#xf6;rgens et&#xa0;al. and Kumari and Kumar (<xref ref-type="bibr" rid="B11">G&#xf6;rgens et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B22">Kumari and Kumar, 2023</xref>), and the result was that the RF model outperformed the SVR model in terms of prediction performance. In the work of G&#xf6;rgens et&#xa0;al. (<xref ref-type="bibr" rid="B11">G&#xf6;rgens et&#xa0;al., 2015</xref>), neural network, RF, and SVR models were used to predict stand volume in fast-growing plantation forests, and the RF model produced the best prediction results. The study conducted by Kumari and Kumar (<xref ref-type="bibr" rid="B22">Kumari and Kumar, 2023</xref>) compared the predictive potential of SVR and RF algorithms in predicting forest AGB. The result was that the predictive performance of RF is better than that of SVR in this study. In these studies above, the RF algorithm achieved better prediction results compared with the SVR. This may be due to the fact that RF is better at handling non-linear relationships and that the model requires fewer hyperparameters to be adjusted compared with SVR. On the other hand, SVR requires selecting appropriate kernel functions and tuning hyperparameters based on the characteristics of the dataset. However, this does not imply that RF outperforms SVR in all scenarios. Therefore, the selection of machine learning methods for inversion of forest AGB needs to be evaluated and compared on the basis of a combination of various factors. In addition, the results of our study using RF to estimate component biomass showed that leaf biomass was the least correlated with LiDAR data, with an <italic>R</italic>
<sup>2</sup> value of 0.54. This result is in agreement with He et&#xa0;al. (<xref ref-type="bibr" rid="B13">He et&#xa0;al., 2013</xref>) who used LiDAR data to estimate the summed component AGB of coniferous forests. In their study, a linear regression model was used, and the results also showed weaker performance for leaf AGB estimation but better performance for stem, branch, and total forest biomass estimation. The range of biomass values of leaves is too low, which may be a reason for the weaker relationship.</p>
<p>Height variables extracted from LiDAR data were strongly correlated with the total and component forest AGBs. In this study, height variables change according to the different component of forest AGBs. <italic>H</italic>
<sub>30</sub>, <italic>H</italic>
<sub>40</sub>, and <italic>H</italic>
<sub>sqt</sub> are the optimized height variables for total AGB estimation, and the same variables are selected as optimal features for stem estimation as well. <italic>H</italic>
<sub>30</sub>, <italic>H</italic>
<sub>mean</sub>, and <italic>H</italic>
<sub>8</sub> are the selected optimal height variables for bark AGB estimation, whereas, for branches and leaves, they are <italic>H</italic>
<sub>sqt</sub>, <italic>H</italic>
<sub>mean</sub>, and <italic>H</italic>
<sub>20</sub> and <italic>H</italic>
<sub>10</sub>, <italic>H</italic>
<sub>20</sub>, and <italic>H</italic>
<sub>9</sub>, respectively. The differences in height variables used for biomass estimation of different components indicate that LiDAR-derived height features have varying explanatory capabilities for biomass composition. It may be related to the extracted height characteristics of LiDAR data to the vertical structure of the forest. In addition, multiple correlations among LiDAR characteristic variables and some overlap among cumulative height percentile variables may also be responsible for the large differences in the relative importance ranking of variables in the component biomass models (<xref ref-type="bibr" rid="B16">Hong et&#xa0;al., 2019</xref>). Cao et&#xa0;al. (<xref ref-type="bibr" rid="B4">Cao et&#xa0;al., 2014</xref>) estimated total and component biomass in a subtropical forest using small discrete and full waveform airborne LiDAR data. Although the inversion methods that they used were MLR models, their results also confirmed that the height variables extracted from LiDAR data were highly correlated with total forest biomass and component biomass. Forest height features extracted from small-footprint data (<xref ref-type="bibr" rid="B34">Popescu, 2007</xref>), small-footprint full-wave form data (<xref ref-type="bibr" rid="B14">Hermosilla et&#xa0;al., 2014a</xref>; <xref ref-type="bibr" rid="B15">Hermosilla et&#xa0;al., 2014b</xref>), and large-footprint SLICER data (<xref ref-type="bibr" rid="B8">Drake et&#xa0;al., 2002</xref>; <xref ref-type="bibr" rid="B24">Lefsky et&#xa0;al., 2005</xref>) also explained most of the variability of them for forest structure characteristics.</p>
<p>The comparisons of different validation method are not addressed in other studies, whereas several studies demonstrated that LOOCV performed better especially the limitations of small samples are existent (<xref ref-type="bibr" rid="B48">Zeng et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B37">Shi et&#xa0;al., 2023</xref>). In this study, the validation difference between LOOCV and cross-validation was compared, and the results revealed that LOOCV showed better accuracy for forest stem, bark, stem, branch, and total AGB estimation but worse accuracy for forest leaf AGB estimation. The accuracy here is related to the value of rRMSE.</p>
<p>Compared with the results of studies using different data sources in the same study area, the height features extracted from LiDAR data outperformed than other data sources. Li et&#xa0;al. (<xref ref-type="bibr" rid="B27">Li et&#xa0;al., 2020</xref>) extracted remote sensing features from Landsat8 OLI, Gaofen-1 optical data, and ALOS-1 PALSAR-1SAR to compute forest total biomass at the same test site. They used a fast iterative procedure to optimize input remote sensing features to improve the inversion capability of K-nearest neighbor (KNN) algorithms; the results were validated by LOOCV method; and <italic>R</italic>&#xb2; = 0.63 and RMSE = 28.84 Mg/ha were weaker than the <italic>R</italic>
<sup>2</sup> and RMSE values for estimated total AGB using RF and SVR and LOOCV validation in this study. Zeng et&#xa0;al. estimated total and component forest AGBs using features extracted from synthetic aperture radar and demonstrated that C-band polarimetric features performed best for forest leaf AGB estimation with <italic>R</italic>
<sup>2</sup>&#xa0;=&#xa0;0.637 and RMSE = 1.27 Mg/ha (<xref ref-type="bibr" rid="B48">Zeng et&#xa0;al., 2022</xref>). The estimation of forest total and component AGBs using different data sources revealed the great potential of LiDAR features for accurate estimation.</p>
<p>Although we explored the forest total biomass and biomass component inversion based on optimal LiDAR-derived feature selection with PLSR algorithm and RF and SVR inversion algorithms, there are other machine learning methods that we do not explored in this study. Moreover, the component biomass in this study was calculated by the conversion factors; it may introduce uncertainties for the inversion results; later, the field collected component biomass could be applied in similar study to reduce the uncertainties.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusions</title>
<p>In this study, 56 height-related features extracted from LiDAR were used in RF and SVR algorithms for forest total and component AGB estimation. PLSR algorithm was utilized for ranking and selecting optimal LiDAR-derived features. LOOCV and cross-validation methods were performed to validate the inversion results obtained by RF and SVR. Four cumulative height percentiles (<italic>AIH</italic>
<sub>30</sub>, <italic>AIH</italic>
<sub>40</sub>, <italic>AIH</italic>
<sub>20</sub>, and <italic>AIH</italic>
<sub>25</sub>), two height percentiles (<italic>H</italic>
<sub>8</sub> and <italic>H</italic>
<sub>6</sub>), and four height-related variables (<italic>H</italic>
<sub>mean</sub>, <italic>H</italic>
<sub>sqrt</sub>, <italic>H</italic>
<sub>mad</sub>, and <italic>H</italic>
<sub>curt</sub>) are more sensitive LiDAR-derived features for total and component forest height estimation. RF performed better than SVR for both forest total biomass and biomass component estimation. LOOCV showed better accuracy for forest stem, bark, stem, branch, and total AGB estimation but worse accuracy for forest leaf AGB estimation. Note that the difference between the validation using LOOCV and cross-validation is no more than 5%. The features extracted from LiDAR showed a weak performance for leaf AGB estimation when compared with other component AGBs and total AGB estimation. Because only 56 height-related features and only two machine learning methods were applied in this study, future work should focus on exploring more metrices especially derived from full-waveform LiDAR data and more machine learning methods like KNN and Gaussian processes.</p>
</sec>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>JM: Methodology, Software, Supervision, Validation, Visualization, Writing &#x2013; original draft. WZ: Conceptualization, Project administration, Resources, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. YJ: Writing &#x2013; original draft, Writing &#x2013; review &amp; editing, Validation, Visualization. JH: Validation, Methodology, Formal Analysis, Writing &#x2013; original draft. GH: Software, Writing &#x2013; original draft. LW: Visualization, Writing &#x2013; original draft.</p>
</sec>
</body>
<back>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article. This work was supported by Yunnan Province agriculture joint special project with grant numbers of 202301BD070001-058 and the National Natural Science Foundation of China with grant numbers of 32160365, 42161059, and 32371869.</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>The authors gratefully acknowledge the support of China Scholarship Council (CSC) for this study.</p>
</ack>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>Author JH is employed by Aisino Xinde Zhitu Beijing Technology Co.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2023.1258521/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2023.1258521/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Asner</surname> <given-names>G. P.</given-names>
</name>
<name>
<surname>Mascaro</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Muller-Landau</surname> <given-names>H. C.</given-names>
</name>
<name>
<surname>Vieilledent</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Vaudry</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Rasamoelina</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>A universal airborne LiDAR approach for tropical forest carbon mapping</article-title>. <source>Oecologia</source> <volume>168</volume>, <fpage>1147</fpage>&#x2013;<lpage>1160</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s00442-011-2165-z</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breidenbach</surname> <given-names>J.</given-names>
</name>
<name>
<surname>N&#xe6;sset</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Lien</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Gobakken</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Solberg</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Prediction of species specific forest inventory attributes using a nonparametric semi-individual tree crown approach based on fused airborne laser scanning and multispectral data</article-title>. <source>Remote Sens. Environ.</source> <volume>114</volume>, <fpage>911</fpage>&#x2013;<lpage>924</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2009.12.004</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Random forests</article-title>. <source>Mach. Learn.</source> <volume>45</volume>, <fpage>5</fpage>&#x2013;<lpage>32</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cao</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Coops</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Hermosilla</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Innes</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Dai</surname> <given-names>J.</given-names>
</name>
<name>
<surname>She</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Using small-footprint discrete and full-waveform airborne liDAR metrics to estimate total biomass and biomass components in subtropical forests</article-title>. <source>Remote Sens.</source> <volume>6</volume>, <fpage>7110</fpage>&#x2013;<lpage>7135</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs6087110</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cao</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Pan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Integrating airborne liDAR and optical data to estimate forest aboveground biomass in arid and semi-arid regions of China</article-title>. <source>Remote Sens.</source> <volume>10</volume>, <elocation-id>532</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs10040532</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Hay</surname> <given-names>G. J.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2010</year>). &#x201c;<article-title>Estimation of forest height, biomass and volume using support vector regression and segmentation from lidar transects and Quickbird imagery</article-title>,&#x201d; in <conf-name>2010 18th International Conference on Geoinformatics</conf-name>, <conf-loc>Beijing, China</conf-loc>. <fpage>1</fpage>&#x2013;<lpage>4</lpage> (IEEE). doi:&#xa0;<pub-id pub-id-type="doi">10.1109/GEOINFORMATICS.2010.5567501</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dixon</surname> <given-names>R. K.</given-names>
</name>
<name>
<surname>Brown</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Houghton</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Solomon</surname> <given-names>A. M.</given-names>
</name>
<name>
<surname>Trexler</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Wisniewski</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>Carbon pools and flux of global forest ecosystems</article-title>. <source>Sci. New Ser.</source> <volume>263</volume>, <fpage>185</fpage>&#x2013;<lpage>190</lpage>. doi: <pub-id pub-id-type="doi">10.1126/science.263.5144.185</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Drake</surname> <given-names>J. B.</given-names>
</name>
<name>
<surname>Dubayah</surname> <given-names>R. O.</given-names>
</name>
<name>
<surname>Clark</surname> <given-names>D. B.</given-names>
</name>
<name>
<surname>Knox</surname> <given-names>R. G.</given-names>
</name>
<name>
<surname>Blair</surname> <given-names>J. B.</given-names>
</name>
<name>
<surname>Hofton</surname> <given-names>M. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2002</year>). <article-title>Estimation of tropical forest structural characteristics using large-footprint lidar</article-title>. <source>Remote Sens. Environ.</source> <volume>79</volume>, <fpage>305</fpage>&#x2013;<lpage>319</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0034-4257(01)00281-4</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Drucker</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Burges</surname> <given-names>C. J. C.</given-names>
</name>
<name>
<surname>Kaufman</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Smola</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Vapnik</surname> <given-names>V.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>Support vector regression machines</article-title>. <source>Adv. Neural Inf. Process. Syst.</source> <volume>9</volume>, <fpage>779</fpage>&#x2013;<lpage>784</lpage>.</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gleason</surname> <given-names>C. J.</given-names>
</name>
<name>
<surname>Im</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Forest biomass estimation from airborne LiDAR data using machine learning approaches</article-title>. <source>Remote Sens. Environ.</source> <volume>125</volume>, <fpage>80</fpage>&#x2013;<lpage>91</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2012.07.006</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>G&#xf6;rgens</surname> <given-names>E. B.</given-names>
</name>
<name>
<surname>Montaghi</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Rodriguez</surname> <given-names>L. C. E.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>A performance comparison of machine learning methods to estimate the fast-growing forest plantation yield based on laser scanning metrics</article-title>. <source>Comput. Electron. Agric.</source> <volume>116</volume>, <fpage>221</fpage>&#x2013;<lpage>227</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.compag.2015.07.004</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>He</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Xiao</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Application of remote sensing in forest aboveground biomass estimation</article-title>. <source>Chin. Journal Ecol.</source> <volume>26</volume>, <fpage>1317</fpage>&#x2013;<lpage>1322</lpage>.</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>He</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>E.</given-names>
</name>
<name>
<surname>An</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Above-ground biomass and biomass components estimation using liDAR data in a coniferous forest</article-title>. <source>Forests</source> <volume>4</volume>, <fpage>984</fpage>&#x2013;<lpage>1002</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/f4040984</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hermosilla</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Coops</surname> <given-names>N. C.</given-names>
</name>
<name>
<surname>Ruiz</surname> <given-names>L. A.</given-names>
</name>
<name>
<surname>Moskal</surname> <given-names>L. M.</given-names>
</name>
</person-group> (<year>2014</year>a). <article-title>Deriving pseudo-vertical waveforms from small-footprint full-waveform LiDAR data</article-title>. <source>Remote Sens. Lett.</source> <volume>5</volume>, <fpage>332</fpage>&#x2013;<lpage>341</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/2150704X.2014.903350</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hermosilla</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Ruiz</surname> <given-names>L. A.</given-names>
</name>
<name>
<surname>Kazakova</surname> <given-names>A. N.</given-names>
</name>
<name>
<surname>Coops</surname> <given-names>N. C.</given-names>
</name>
<name>
<surname>Moskal</surname> <given-names>L. M.</given-names>
</name>
</person-group> (<year>2014</year>b). <article-title>Estimation of forest structure and canopy fuel parameters from small-footprint full-waveform LiDAR data</article-title>. <source>Int. J. Wildland Fire</source> <volume>23</volume>, <fpage>224</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1071/WF13086</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hong</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Xiang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Pang</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Inversion of biomass components for larix olgensis plantation using airborne liDAR</article-title>. <source>For. Res.</source> <volume>32</volume>, <fpage>83</fpage>&#x2013;<lpage>90</lpage>.</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ji</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Zeng</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Qu</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Forest above ground biomass estimation using airborne P band polarimetric SAR data</article-title>. <source>J. Zhejiang A&amp;F Univ.</source> <volume>39</volume>, <fpage>971</fpage>&#x2013;<lpage>980</lpage>.</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jia</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Biomass allocation in relation to stand density in Pinus tabuliformis plantation</article-title>. <source>Journal Nanjing Forest. Univ. (Natural Sci. Edition)</source> <volume>39</volume>, <fpage>87</fpage>&#x2013;<lpage>92</lpage>.</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Fu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Improving aboveground biomass estimation of natural forests on the Tibetan Plateau using spaceborne LiDAR and machine learning algorithms</article-title>. <source>Ecol. Indic.</source> <volume>143</volume>, <elocation-id>109365</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ecolind.2022.109365</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ju</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Ji</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Inversion of forest aboveground biomass using combination of LiDAR and multispectral data</article-title>. <source>J. Nanjing Forest. Univ. (Natural Sci. Edition)</source> <volume>46</volume>, <fpage>58</fpage>&#x2013;<lpage>68</lpage>.</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kotsiantis</surname> <given-names>S. B.</given-names>
</name>
<name>
<surname>Zaharakis</surname> <given-names>I. D.</given-names>
</name>
<name>
<surname>Pintelas</surname> <given-names>P. E.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Machine learning: a review of classification and combining techniques</article-title>. <source>Artif. Intell. Rev.</source> <volume>26</volume>, <fpage>159</fpage>&#x2013;<lpage>190</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10462-007-9052-3</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Kumari</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Kumar</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2023</year>). &#x201c;<article-title>Machine learning based modeling for forest aboveground biomass retrieval</article-title>,&#x201d; in <conf-name>2023 International Conference on Machine Intelligence for GeoAnalytics and Remote Sensing (MIGARS)</conf-name>, <conf-loc>Hyderabad, India</conf-loc>. <fpage>1</fpage>&#x2013;<lpage>4</lpage> (IEEE). doi:&#xa0;<pub-id pub-id-type="doi">10.1109/MIGARS57353.2023.10064607</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lambert</surname> <given-names>M.-C.</given-names>
</name>
<name>
<surname>Ung</surname> <given-names>C.-H.</given-names>
</name>
<name>
<surname>Raulier</surname> <given-names>F.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Canadian national tree aboveground biomass equations</article-title>. <source>Can. J. For. Res.</source> <volume>35</volume>, <fpage>1996</fpage>&#x2013;<lpage>2018</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1139/x05-112</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lefsky</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Hudak</surname> <given-names>A. T.</given-names>
</name>
<name>
<surname>Cohen</surname> <given-names>W. B.</given-names>
</name>
<name>
<surname>Acker</surname> <given-names>S. A.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Patterns of covariance between forest stand and canopy structure in the Pacific Northwest</article-title>. <source>Remote Sens. Environ.</source> <volume>95</volume>, <fpage>517</fpage>&#x2013;<lpage>531</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2005.01.004</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Bi</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Hao</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Cui</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Aboveground biomass estimation in forests with random forest and Monte Carlo-based uncertainty analysis</article-title>. <source>Ecol. Indic.</source> <volume>142</volume>, <elocation-id>109246</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ecolind.2022.109246</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Niu</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Forest above-ground biomass estimation at plot and tree levels using airborne LiDAR data</article-title>. <source>J. Remote Sens.</source> <volume>19</volume>, <fpage>669</fpage>&#x2013;<lpage>679</lpage>.</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Cui</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Ji</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Inversion exploration on forest aboveground biomass of optical and SAR data supported by parameter optimization method</article-title>. <source>J. OF Beijing FORESTRY Univ.</source> <volume>42</volume>, <fpage>11</fpage>&#x2013;<lpage>19</lpage>.</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Hao</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Fast leave-one-out cross-validation algorithm for extreme learning machine</article-title>. <source>J. OF SHANGHAL JAOTONG Univ.</source> <volume>45</volume>, <fpage>1140</fpage>&#x2013;<lpage>1145</lpage>.</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>F.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Estimating forest structural attributes using UAV-LiDAR data in Ginkgo plantations</article-title>. <source>ISPRS J. Photogram. Remote Sens.</source> <volume>146</volume>, <fpage>465</fpage>&#x2013;<lpage>482</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.isprsjprs.2018.11.001</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Micha&#x142;owska</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Rapi&#x144;ski</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>A review of tree species classification based on airborne liDAR data and applied classifiers</article-title>. <source>Remote Sens.</source> <volume>13</volume>, <elocation-id>353</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs13030353</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>N&#xe6;sset</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Gobakken</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Estimation of above- and below-ground biomass across regions of the boreal forest zone using airborne laser</article-title>. <source>Remote Sens. Environ.</source> <volume>112</volume>, <fpage>3079</fpage>&#x2013;<lpage>3090</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2008.03.004</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nie</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Zeng</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Xi</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Above-ground biomass estimation using airborne discrete-return and full-waveform LiDAR data in a coniferous forest</article-title>. <source>Ecol. Indic.</source> <volume>78</volume>, <fpage>221</fpage>&#x2013;<lpage>228</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ecolind.2017.02.045</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Ju</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Jia</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Si</surname> <given-names>L.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>LiCHy: the CAF&#x2019;s liDAR, CCD and hyperspectral integrated airborne observation system</article-title>. <source>Remote Sens.</source> <volume>8</volume>, <elocation-id>398</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs8050398</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Popescu</surname> <given-names>S. C.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Estimating biomass of individual pine trees using airborne lidar</article-title>. <source>Biomass Bioenergy</source> <volume>31</volume>, <fpage>646</fpage>&#x2013;<lpage>655</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.biombioe.2007.06.022</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Saatchi</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Halligan</surname> <given-names>K.</given-names>
</name>
<name>
<surname>DeSpain</surname> <given-names>D. G.</given-names>
</name>
<name>
<surname>Crabtree</surname> <given-names>R. L.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Estimation of forest fuel load from radar remote sensing</article-title>. <source>IEEE Trans. Geosci. Remote Sens.</source> <volume>45</volume>, <fpage>1726</fpage>&#x2013;<lpage>1740</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/TGRS.2006.887002</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Salas</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Ene</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Gregoire</surname> <given-names>T. G.</given-names>
</name>
<name>
<surname>N&#xe6;sset</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Gobakken</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Modelling tree diameter from airborne laser scanning derived variables: A comparison of spatial statistical models</article-title>. <source>Remote Sens. Environ.</source> <volume>114</volume>, <fpage>1277</fpage>&#x2013;<lpage>1285</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2010.01.020</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shi</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Marino</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Zeng</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Ji</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>H.</given-names>
</name>
<etal/>
</person-group>. (<year>2023</year>). <article-title>Forest total and component biomass retrieval via GA-SVR algorithm and quad-polarimetric SAR data</article-title>. <source>Int. J. Appl. Earth Observ. Geoinform.</source> <volume>118</volume>, <elocation-id>103275</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jag.2023.103275</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="book">
<person-group person-group-type="author">
<collab>State Forestry Administration of China</collab>
</person-group> (<year>2016</year>a). <source>Tree Biomass Models and Related Parameters to Carbon Accounting for Betula platyphylla</source> (<publisher-loc>Beijing, China</publisher-loc>: <publisher-name>Standards Press of China</publisher-name>).</citation>
</ref>
<ref id="B39">
<citation citation-type="book">
<person-group person-group-type="author">
<collab>State Forestry Administration of China</collab>
</person-group> (<year>2016</year>b). <source>Tree Biomass Models and Related Parameters to Carbon Accounting for Larix gmelinii</source> (<publisher-loc>Beijing, China</publisher-loc>: <publisher-name>Standards Press of China</publisher-name>).</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Torre-Tojal</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Bastarrika</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Boyano</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Lopez-Guede</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Gra&#xf1;a</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Above-ground biomass estimation from LiDAR data using random forest algorithms</article-title>. <source>J. Comput. Sci.</source> <volume>58</volume>, <elocation-id>101517</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jocs.2021.101517</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tsui</surname> <given-names>O. W.</given-names>
</name>
<name>
<surname>Coops</surname> <given-names>N. C.</given-names>
</name>
<name>
<surname>Wulder</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Marshall</surname> <given-names>P. L.</given-names>
</name>
<name>
<surname>McCardle</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Using multi-frequency radar and discrete-return LiDAR measurements to estimate above-ground biomass and biomass components in a coastal temperate forest</article-title>. <source>ISPRS J. Photogram. Remote Sens.</source> <volume>69</volume>, <fpage>121</fpage>&#x2013;<lpage>133</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.isprsjprs.2012.02.009</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Urbazaev</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Thiel</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Cremer</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Dubayah</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Migliavacca</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Reichstein</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Estimation of forest aboveground biomass and uncertainties by integration of field measurements, airborne LiDAR, and SAR and optical satellite data in Mexico</article-title>. <source>Carbon Balance Manage</source> <volume>13</volume>, <elocation-id>5</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13021-018-0093-5</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vaglio Laurin</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Puletti</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Corona</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Papale</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Valentini</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Above ground biomass and tree species richness estimation with airborne lidar in tropical Ghana forests</article-title>. <source>Int. J. Appl. Earth Observ. Geoinform.</source> <volume>52</volume>, <fpage>371</fpage>&#x2013;<lpage>379</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jag.2016.07.008</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vauhkonen</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Korpela</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Maltamo</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Tokola</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Imputation of single-tree attributes using airborne laser scanning-based height, intensity, and alpha shape metrics</article-title>. <source>Remote Sens. Environ.</source> <volume>114</volume>, <fpage>1263</fpage>&#x2013;<lpage>1276</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2010.01.016</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiong</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Five understandings on support vector machine regression</article-title>. <source>HJDM</source> <volume>09</volume>, <fpage>52</fpage>&#x2013;<lpage>59</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.12677/HJDM.2019.92007</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xue</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Chai</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Iden tification and prediction of aerodynam ic data in flight smulation based on SVR</article-title>. <source>FLIGHT DYNAM.</source> <volume>9</volume>, <fpage>52</fpage>&#x2013;<lpage>59</lpage>.</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Shao</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Brisco</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>An improved scheme for rice phenology estimation based on time-series multispectral HJ-1A/B and polarimetric RADARSAT-2 data</article-title>. <source>Remote Sens. Environ.</source> <volume>195</volume>, <fpage>184</fpage>&#x2013;<lpage>201</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2017.04.016</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zeng</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Forest total and component above-ground biomass (AGB) estimation through C- and L-band polarimetric SAR data</article-title>. <source>Forests</source> <volume>13</volume>, <elocation-id>442</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/f13030442</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>E.</given-names>
</name>
<name>
<surname>He</surname> <given-names>Q.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Review of methods on estimating forest above ground biomass</article-title>. <source>J. Beijing Forest. Univ.</source> <volume>33</volume>, <fpage>144</fpage>&#x2013;<lpage>150</lpage>.</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Popescu</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Nelson</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Lidar remote sensing of forest biomass: A scale-invariant estimation approach using airborne lasers</article-title>. <source>Remote Sens. Environ.</source> <volume>113</volume>, <fpage>182</fpage>&#x2013;<lpage>196</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2008.09.009</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Tian</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Comparison of machine learning algorithms for forest parameter estimations and application for forest quality assessments</article-title>. <source>For. Ecol. Manage.</source> <volume>434</volume>, <fpage>224</fpage>&#x2013;<lpage>234</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.foreco.2018.12.019</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Xuan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Gong</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Tan</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Estimating 3D green volume and aboveground biomass of urban forest trees by UAV-lidar</article-title>. <source>Remote Sens.</source> <volume>14</volume>, <elocation-id>5211</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs14205211</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>