<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2017.00447</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Using a Structural Root System Model to Evaluate and Improve the Accuracy of Root Image Analysis Pipelines</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Lobet</surname> <given-names>Guillaume</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x0002A;</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x02020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/131450/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Koevoets</surname> <given-names>Iko T.</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x02020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/356689/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Noll</surname> <given-names>Manuel</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x02020;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Meyer</surname> <given-names>Patrick E.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Tocquin</surname> <given-names>Pierre</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/131435/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Pag&#x000E8;s</surname> <given-names>Lo&#x000EF;c</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/378082/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>P&#x000E9;rilleux</surname> <given-names>Claire</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/123234/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>InBioS-PhytoSYSTEMS, University of Li&#x000E8;ge</institution> <country>Li&#x000E8;ge, Belgium</country></aff>
<aff id="aff2"><sup>2</sup><institution>Institut f&#x000FC;r Bio-und Geowissenschaften: Agrosphare, Forschungszentrum J&#x000FC;lich</institution> <country>J&#x000FC;lich, Germany</country></aff>
<aff id="aff3"><sup>3</sup><institution>Plant Cell Biology, Swammerdam Institute for Life Sciences, University of Amsterdam</institution> <country>Amsterdam, Netherlands</country></aff>
<aff id="aff4"><sup>4</sup><institution>INRA, Centre d&#x00027;Avignon, UR 1115 PSH</institution> <country>Avignon, France</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Alexander Bucksch, University of Georgia, USA</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Christopher N. Topp, Donald Danforth Plant Science Center, USA; Tony Pridmore, University of Nottingham, UK</p></fn>
<fn fn-type="corresp" id="fn001"><p>&#x0002A;Correspondence: Guillaume Lobet <email>g.lobet&#x00040;fz-juelich.de</email></p></fn>
<fn fn-type="other" id="fn002"><p>This article was submitted to Plant Biophysics and Modeling, a section of the journal Frontiers in Plant Science</p></fn>
<fn fn-type="other" id="fn003"><p>&#x02020;These authors have contributed equally to this work.</p></fn></author-notes>
<pub-date pub-type="epub">
<day>03</day>
<month>04</month>
<year>2017</year>
</pub-date>
<pub-date pub-type="collection">
<year>2017</year>
</pub-date>
<volume>8</volume>
<elocation-id>447</elocation-id>
<history>
<date date-type="received">
<day>14</day>
<month>09</month>
<year>2016</year>
</date>
<date date-type="accepted">
<day>15</day>
<month>03</month>
<year>2017</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2017 Lobet, Koevoets, Noll, Meyer, Tocquin, Pag&#x000E8;s and P&#x000E9;rilleux.</copyright-statement>
<copyright-year>2017</copyright-year>
<copyright-holder>Lobet, Koevoets, Noll, Meyer, Tocquin, Pag&#x000E8;s and P&#x000E9;rilleux</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) or licensor are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>Root system analysis is a complex task, often performed with fully automated image analysis pipelines. However, the outcome is rarely verified by ground-truth data, which might lead to underestimated biases. We have used a root model, ArchiSimple, to create a large and diverse library of ground-truth root system images (10,000). For each image, three levels of noise were created. This library was used to evaluate the accuracy and usefulness of several image descriptors classically used in root image analysis softwares. Our analysis highlighted that the accuracy of the different traits is strongly dependent on the quality of the images and the type, size, and complexity of the root systems analyzed. Our study also demonstrated that machine learning algorithms can be trained on a synthetic library to improve the estimation of several root system traits. Overall, our analysis is a call to caution when using automatic root image analysis tools. If a thorough calibration is not performed on the dataset of interest, unexpected errors might arise, especially for large and complex root images. To facilitate such calibration, both the image library and the different codes used in the study have been made available to the community.</p>
</abstract>
<kwd-group>
<kwd>image analysis</kwd>
<kwd>root structural model</kwd>
<kwd>benchmarking</kwd>
<kwd>image library</kwd>
<kwd>machine learning</kwd>
</kwd-group>
<contract-num rid="cn001">P7/29</contract-num>
<contract-num rid="cn002">1.B.237.15F</contract-num>
<contract-num rid="cn002">1.A.320.16F</contract-num>
<contract-sponsor id="cn001">Federaal Wetenschapsbeleid<named-content content-type="fundref-id">10.13039/501100002749</named-content></contract-sponsor>
<contract-sponsor id="cn002">Fonds De La Recherche Scientifique - FNRS<named-content content-type="fundref-id">10.13039/501100002661</named-content></contract-sponsor>
<counts>
<fig-count count="7"/>
<table-count count="3"/>
<equation-count count="5"/>
<ref-count count="19"/>
<page-count count="11"/>
<word-count count="5790"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>Roots are of utmost importance in the life of plants and hence selection on root systems represents great promise for improving crop tolerance to biotic and abiotic stresses (as reviewed in Koevoets et al., <xref ref-type="bibr" rid="B9">2016</xref>). As such, their quantification is a challenge in many research projects. This quantification is usually two-fold. The first step consists in acquiring images of the root system, either using classic imaging techniques (CCD cameras) or more specialized ones (microCT, X-Ray, fluorescence,&#x02026;). The next step is to analyse the pictures to extract meaningful descriptors of the root system.</p>
<p>To paraphrase the famous Belgian surrealist painter, Ren&#x000E9; Magritte: &#x0201C;Figure <xref ref-type="fig" rid="F1">1A</xref> is not a root system.&#x0201D; Figure <xref ref-type="fig" rid="F1">1A</xref> is an image of a root system and that distinction is important. An image is indeed a two-dimensional representation of an object, which is usually three-dimensional. Nowadays, measurements are generally not performed on the root systems themselves, but on the images, and this raises some issues.</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p><bold>(A)</bold> Image of a 2-week old maize root system grown in rhizotron. <bold>(B)</bold> Close-up showing overlapping roots. <bold>(C)</bold> Close-up showing crossing roots.</p></caption>
<graphic xlink:href="fpls-08-00447-g0001.tif"/>
</fig>
<p>Image analysis is the acquisition of traits (or descriptors) describing the objects contained in a particular image. In a perfect situation, these descriptors would accurately represent the biological object of the image with negligible deviation from the biological truth (or data). However, in many cases, artifacts might be present in the images so that the representation of the biological object is not accurate anymore. These artifacts might be due to the conditions under which the images were taken or to the object itself. Mature root systems, for instance, are complex branched structures, composed of thousands of overlapping (Figure <xref ref-type="fig" rid="F1">1B</xref>), and crossing segments (Figure <xref ref-type="fig" rid="F1">1C</xref>). These features are likely to impede image analysis and create a gap between the descriptors and the data.</p>
<p>Root image descriptors can be separated into two main categories: morphological and geometrical descriptors. Morphological descriptors refer to the shape of the different root segments forming the root system (Table <xref ref-type="table" rid="T1">1</xref>). They include, among others, the length and diameter of the different roots. For complex root system images, morphological descriptors are difficult to obtain and are prone to error as mentioned above. Geometrical descriptors give the position of the different root segments in space. They summarize the shape of the root system as a whole. The simplest geometrical descriptors are the width and depth of the root system. Since these descriptors are mostly defined by the external envelope of the root system, crossing and overlapping segments have little impact on their estimation and hence they can be considered as relatively errorless. Geometrical descriptors are expected to be loosely linked to the actual root system topology, since identical shapes could be obtained from different root systems (the opposite is true as well). They are usually used in genetic studies, to identify genetic bases of root system shape and soil exploration.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p><bold>Root system parameters used as ground-truth data</bold>.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Name</bold></th>
<th valign="top" align="left"><bold>Description</bold></th>
<th valign="top" align="left"><bold>Unit</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">tot_root_length</td>
<td valign="top" align="left">The cumulative length of all roots</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">tot_1_order_length</td>
<td valign="top" align="left">The cumulative length of all root axes</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">tot_2&#x0002B;_order_length</td>
<td valign="top" align="left">The cumulative length of all lateral roots</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_1_order_length</td>
<td valign="top" align="left">The mean first-order roots length</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_2&#x0002B;_order_length</td>
<td valign="top" align="left">The mean lateral root length</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">n_1_orders</td>
<td valign="top" align="left">The total number of first order roots</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">n_2&#x0002B;_orders</td>
<td valign="top" align="left">The total number of lateral roots</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">mean_2&#x0002B;_order_density</td>
<td valign="top" align="left">The mean lateral root density: for each first-order root, the number of lateral roots divided by the axis length (total length).</td>
<td valign="top" align="left">mm-1</td>
</tr>
<tr>
<td valign="top" align="left">mean_1_order_diam</td>
<td valign="top" align="left">The mean diameter of the first-order roots</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_2&#x0002B;_order_diam</td>
<td valign="top" align="left">The mean diameter of the lateral roots</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_2&#x0002B;_order_angle</td>
<td valign="top" align="left">The mean insertion angle of the lateral roots</td>
<td valign="top" align="left">&#x000B0;</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Several automated analysis tools were designed in the last few years to extract both types of descriptors from root images (Armengaud et al., <xref ref-type="bibr" rid="B1">2009</xref>; Galkovskyi et al., <xref ref-type="bibr" rid="B7">2012</xref>; Pierret et al., <xref ref-type="bibr" rid="B16">2013</xref>; Bucksch et al., <xref ref-type="bibr" rid="B5">2014</xref>). However, the validation of such tools is often incomplete and/or error prone. For technical reasons, the validation is usually performed on a small number of ground-truth images of young root systems. In agreement, most analysis tools are specifically designed for this kind of root systems. In the few cases where validation is performed on large and complex root systems, it is usually not on ground-truth images, but in comparison with previously published tools (measurement of X with tool A compared with the same measurement with tool B). This might seem a reasonable approach, regarding the scarcity of ground-truth images of large root systems. However, the inherent limitations of these tools, such as scale or root system type (fibrous- vs. tap-roots) are often not known. Users might not even be aware that such limitations exist and apply the provided algorithm without further validation on their own images. This can lead to unexpected errors in the final measurements.</p>
<p>One strategy to address the lack of in-depth validation of image analysis pipelines would be to use synthetic images generated by structural root models (models designed to recreate the physical structure and shape of root systems). Many structural root models have been developed, either to model specific plant species (Pag&#x000E8;s et al., <xref ref-type="bibr" rid="B13">1989</xref>), or to be generic (Pag&#x000E8;s et al., <xref ref-type="bibr" rid="B15">2004</xref>, <xref ref-type="bibr" rid="B12">2013</xref>). These models have been repeatedly shown to faithfully represent the root system structure (Pag&#x000E8;s and Pellerin, <xref ref-type="bibr" rid="B14">1996</xref>). In addition, they can provide the ground-truth data for each synthetic root system generated, independently of its complexity. However, they have not been used for validation of image analysis tools (Rell&#x000E1;n-&#x000C1;lvarez et al., <xref ref-type="bibr" rid="B17">2015</xref>), with one exception performed on young seedling unbranched roots (Benoit et al., <xref ref-type="bibr" rid="B2">2014</xref>).</p>
<p>Here we (i) illustrate the use of a structural root model, Archisimple, to systematically analyse and evaluate an image analysis pipeline and (ii) use the model-generated images to improve the estimation of root traits.</p>
</sec>
<sec sec-type="materials and methods" id="s2">
<title>Materials and methods</title>
<sec>
<title>Nomenclature used in the paper</title>
<list list-type="simple">
<list-item><p><bold>Ground-truth data</bold>: The real (geometrical and morphometrical) properties of the root system as a biological object. They are determined by either manual tracking of roots or by using the output of simulated root systems.</p></list-item>
<list-item><p><bold>(Image) Descriptor</bold>: Property of the root image. It does not necessarily have a biological meaning.</p></list-item>
<list-item><p><bold>Root axes:</bold> First order roots, directly attached to the shoot.</p></list-item>
<list-item><p><bold>Lateral roots:</bold> Second- (or lower) order roots, attached to another root.</p></list-item>
</list>
</sec>
<sec>
<title>Creation of a root system library</title>
<p>We used the model ArchiSimple, which was shown to allow the generation of a large diversity of root systems with a minimal amount of parameters (Pag&#x000E8;s et al., <xref ref-type="bibr" rid="B12">2013</xref>). To produce a large library of root systems, we ran the model 10,000 times, each time with a random set of parameters (Figure <xref ref-type="fig" rid="F2">2A</xref>). For each simulation, the growth and development of the root system were constrained in two dimensions.</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p><bold>Overview of the workflow used in this study</bold>. <bold>(A)</bold> Generation of root systems using Archisimple. <bold>(B)</bold> Creation and analysis of root images. <bold>(C)</bold> Use of Random Forest algorithms to better estimate root system ground-truths. <bold>(D)</bold> Illustration of the different noise levels used in the analysis. <bold>(E)</bold> Example of descriptors extracted with RIA-J.</p></caption>
<graphic xlink:href="fpls-08-00447-g0002.tif"/>
</fig>
<p>The simulations were divided into two main groups: fibrous and tap-rooted. For the fibrous simulations, the model generated a random number of root axes and secondary (radial) growth was disabled. For tap-root simulations, only one root axis was produced and secondary growth was enabled (the extent of which was determined by a random parameter).</p>
<p>The root system created in each simulation was stored in a Root System Markup Language (RSML) file. Each RSML file was then read by the RSML Reader plugin from ImageJ to extract ground-truth data for the library (Lobet et al., <xref ref-type="bibr" rid="B10">2015</xref>). These ground-truth data included geometrical and morphological parameters (Table <xref ref-type="table" rid="T1">1</xref>). For each RSML data file, the RSML Reader plugin also created three JPEG images (at a resolution of 300 DPI) for each root system. To simulate one type of image degradation, we added different levels of noise to the images (using the Salt and Pepper Filter in ImageJ) (Figure <xref ref-type="fig" rid="F2">2D</xref>). For each root system, we computed overlapping index as the number of root segments having an overlap with other root segments over the total number of root segments.</p>
</sec>
<sec>
<title>Root image analysis</title>
<p>Each generated image was analyzed using a custom-made ImageJ plugin, Root Image Analysis-J (or RIA-J). For each image, we extracted a set of classical root image descriptors, such as the total root length, the projected area, and the number of visible root tips (Figure <xref ref-type="fig" rid="F2">2E</xref>). In addition, we included shape descriptors such as the convex-hull area or the exploration ratio (see Supplemental File <xref ref-type="supplementary-material" rid="SM3">1</xref> for details of RIA-J). The list of traits and algorithms used by our pipeline is listed in Table <xref ref-type="table" rid="T2">2</xref>. Distribution of the different descriptors is given in the Supplemental Figure <xref ref-type="supplementary-material" rid="SM2">2</xref>.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p><bold>Root image descriptors extracted by RIA-J</bold>.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Name</bold></th>
<th valign="top" align="left"><bold>Description</bold></th>
<th valign="top" align="left"><bold>Unit</bold></th>
<th valign="top" align="left"><bold>Reference</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" colspan="4" style="background-color:#bbbdc0"><bold>MORPHOLOGY</bold></td>
</tr>
<tr>
<td valign="top" align="left">area</td>
<td valign="top" align="left">Projected area of the root system</td>
<td valign="top" align="left">mm<sup>2</sup></td>
<td valign="top" align="left">Galkovskyi et al., <xref ref-type="bibr" rid="B7">2012</xref></td>
</tr>
<tr>
<td valign="top" align="left">length</td>
<td valign="top" align="left">Length of the skeleton of the root system image</td>
<td valign="top" align="left">mm</td>
<td valign="top" align="left">Galkovskyi et al., <xref ref-type="bibr" rid="B7">2012</xref></td>
</tr>
<tr>
<td valign="top" align="left">tip_count</td>
<td valign="top" align="left">Number of end branches in the root system skeleton</td>
<td valign="top" align="left">&#x02013;</td>
<td/>
</tr>
<tr>
<td valign="top" align="left">diam_mean</td>
<td valign="top" align="left">Mean diameter of the root object in the image</td>
<td valign="top" align="left">mm</td>
<td/>
</tr>
<tr>
<td valign="top" align="left" colspan="4" style="background-color:#bbbdc0"><bold>GEOMETRY</bold></td>
</tr>
<tr>
<td valign="top" align="left">width</td>
<td valign="top" align="left">The maximal width of the root system</td>
<td valign="top" align="left">mm</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">depth</td>
<td valign="top" align="left">The maximal depth of the root system</td>
<td valign="top" align="left">mm</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">width_depth_ratio</td>
<td valign="top" align="left">Ratio between the width and the depth of the root system</td>
<td valign="top" align="left">&#x02013;</td>
<td valign="top" align="left">Galkovskyi et al., <xref ref-type="bibr" rid="B7">2012</xref></td>
</tr>
<tr>
<td valign="top" align="left">com_x&#x02013;com_y</td>
<td valign="top" align="left">Relative coordinates of the center of mass of the root system</td>
<td valign="top" align="left">&#x02013;</td>
<td valign="top" align="left">Galkovskyi et al., <xref ref-type="bibr" rid="B7">2012</xref></td>
</tr>
<tr>
<td valign="top" align="left">convexhull</td>
<td valign="top" align="left">Area of the smallest convex shape encapsulating the root system</td>
<td valign="top" align="left">mm<sup>2</sup></td>
<td valign="top" align="left">Galkovskyi et al., <xref ref-type="bibr" rid="B7">2012</xref></td>
</tr>
<tr>
<td valign="top" align="left">exploration</td>
<td valign="top" align="left">Ratio between the convex hull area and the projected area</td>
<td valign="top" align="left">&#x02013;</td>
<td valign="top" align="left">Galkovskyi et al., <xref ref-type="bibr" rid="B7">2012</xref></td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec>
<title>Data analysis</title>
<p>Data analysis was performed in R (R Core Team)<xref ref-type="fn" rid="fn0001"><sup>1</sup></xref>. Plots were created using <italic>ggplot2</italic> (Wickham, <xref ref-type="bibr" rid="B19">2009</xref>) and <italic>lattice</italic> (Sarkar, <xref ref-type="bibr" rid="B18">2008</xref>).</p>
<p>The Mean Relative Errors (MRE) were estimated using the equation:</p>
<disp-formula id="E1"><mml:math id="M1"><mml:mtable columnalign="left"><mml:mtr><mml:mtd><mml:mi>M</mml:mi><mml:mi>R</mml:mi><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:msubsup><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:msubsup></mml:mstyle><mml:mfrac><mml:mrow><mml:mo>|</mml:mo><mml:msub><mml:mrow><mml:mover accent="false" class="mml-overline"><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mo accent="true">&#x000AF;</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>&#x000A0;</mml:mo><mml:mo>-</mml:mo><mml:mo>&#x000A0;</mml:mo><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>|</mml:mo></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mover accent="false" class="mml-overline"><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mo accent="true">&#x000AF;</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfrac></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>where <italic>n</italic> is the number of observations, <inline-formula><mml:math id="M2"><mml:msub><mml:mrow><mml:mover accent="false" class="mml-overline"><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mo accent="true">&#x000AF;</mml:mo></mml:mover></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> is the ground-truth and <italic>y</italic><sub><italic>i</italic></sub> is the estimated ground-truth.</p>
</sec>
<sec>
<title>Random forest framework</title>
<p>A <italic>random forest</italic> is a state-of-the-art machine learning algorithm typically used for making new predictions (in both classification and regression tasks). Random Forests can perform non-linear predictions and, thus, often outperform linear models. Since its introduction by Breiman (<xref ref-type="bibr" rid="B4">2001</xref>), Random Forests have been widely used in many fields from gene regulatory network inference to generic image classification (Huynh-Thu et al., <xref ref-type="bibr" rid="B8">2013</xref>; Mar&#x000E9;e et al., <xref ref-type="bibr" rid="B11">2016</xref>). Random Forest relies on growing a multitude of decision trees, a prediction algorithm that has shown good performances by itself but, when combined with other decision trees (hence the name forest), returns predictions that are much more robust to outliers and noisy data (see bootstrap aggregating, Breiman, <xref ref-type="bibr" rid="B3">1996</xref>).</p>
<p>In a machine learning setting one is given a set <italic>D</italic> &#x0003D; {(<italic>x</italic><sub>1</sub>, <italic>y</italic><sub>1</sub>), (<italic>x</italic><sub>2</sub>, <italic>y</italic><sub>2</sub>), &#x02026;, (<italic>x</italic><sub><italic>n</italic></sub>, <italic>y</italic><sub><italic>n</italic></sub>)},</p>
<p>where <inline-formula><mml:math id="M3"><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msubsup><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msubsup><mml:mo>&#x02026;</mml:mo><mml:mo>,</mml:mo><mml:msubsup><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>s</mml:mi></mml:mrow></mml:msubsup></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> is an element of a <italic>s</italic>&#x02212;dimensional <italic>feature space X</italic>,</p>
<p>and <inline-formula><mml:math id="M4"><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msubsup><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:mo>&#x02026;</mml:mo><mml:mo>,</mml:mo><mml:msubsup><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msubsup></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula> an element of a <italic>t</italic>&#x02212;dimensional <italic>response space Y</italic>.</p>
<p>The learning task is to find a model</p>
<disp-formula id="E2"><mml:math id="M5"><mml:mtable columnalign="left"><mml:mtr><mml:mtd><mml:mi>M</mml:mi><mml:mo>:</mml:mo><mml:mi>X</mml:mi><mml:mo>&#x02192;</mml:mo><mml:mi>Y</mml:mi></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>that predicts the data in a good way, where goodness is measured with regard to an error function <italic>L</italic>.</p>
<p>A decision tree <italic>T</italic><sub><italic>D</italic></sub> is a machine learning method that, for a dataset <italic>D</italic>, constructs a binary tree with each node representing a binary question and each leaf a value of the response space. In other words, a prediction can be made from an input value by looking at the set of binary questions that leads to a leaf (e.g., is the first-order root bigger than q1 and if yes is the number of second-order roots smaller than q2 and if no, &#x02026;).</p>
<p>Each decision is based upon exactly one feature and is used for deciding which branch of the tree a given input value must take. Hence a decision tree splits successively the set <italic>D</italic> into smaller subsets and assigns them a value <italic>y</italic><sub><italic>i</italic></sub> &#x0003D; <italic>T</italic><sub><italic>D</italic></sub>(<italic>x</italic><sub><italic>i</italic></sub>) of the response space.</p>
<p>The choice of the feature used for splitting depends on a relevance criterion. In our setting, the default relevance criterion from the randomForest R package (CRAN randomForest, <xref ref-type="bibr" rid="B6">2015</xref>), namely the Gini index, has been used.</p>
<p>A Random Forest</p>
<disp-formula id="E3"><label>(1)</label><mml:math id="M6"><mml:mtable class="eqnarray" columnalign="right center left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>F</mml:mi></mml:mrow><mml:mrow><mml:mi>D</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>T</mml:mi></mml:mrow><mml:mrow><mml:mi>D</mml:mi><mml:mo>,</mml:mo><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mrow><mml:mrow><mml:mi>k</mml:mi><mml:mo>&#x000A0;</mml:mo><mml:mo>&#x02208;</mml:mo><mml:mo>&#x000A0;</mml:mo><mml:mi>I</mml:mi></mml:mrow></mml:msub><mml:mo>&#x000A0;</mml:mo><mml:mtext>where</mml:mtext><mml:mo>&#x000A0;</mml:mo><mml:mi>I</mml:mi><mml:mo>&#x000A0;</mml:mo><mml:mo>=</mml:mo><mml:mrow><mml:mo>{</mml:mo><mml:mrow><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mn>2</mml:mn><mml:mo>,</mml:mo><mml:mo>&#x02026;</mml:mo><mml:mo>.</mml:mo><mml:mi>l</mml:mi></mml:mrow><mml:mo>}</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>consists of <italic>l</italic> decision trees <italic>T</italic><sub><italic>D, k</italic></sub>, where several key parameters such as the feature space, are chosen randomly (hence the word Random in the algorithm name). While using a random subspace strongly accelerates the growth of a single tree, it can also decrease its accuracy. However, the use of large number of trees counterbalance advantageously those two effects. The final prediction for each input value <italic>x</italic><sub><italic>i</italic></sub> corresponds to the majority vote of all the decision trees of the forest <italic>T</italic><sub><italic>D, k</italic></sub>(<italic>x</italic><sub><italic>i</italic></sub>) in a classification setting while an average of all predicted values is used in a regression task.</p>
<sec>
<title>Framework description</title>
<p>Our method consists of three typical steps:
<list list-type="order">
<list-item><p>A preprocessing step, where we replace missing values of the training set.</p></list-item>
<list-item><p>A model generation step where, for each response variable, we generate different models according to two Random Forest parameters (number of trees and number of splits).</p></list-item>
<list-item><p>A model selection step, where we choose the best performing pair of parameters of the previous step for each one of the response variable.</p></list-item>
</list></p>
</sec>
<sec>
<title>Preprocessing</title>
<p>Missing values in our dataset might arise due to highly noisy images, where the measurement of certain descriptors has been infeasible. To deal with this issue, we first replaced missing values.</p>
<p>This is done using the imputation function of the randomForest R package. It replaces all missing values of a response variable by the median and then a Random Forest is applied on the completed data to predict a more accurate value. We favored 10 trees for computing the new value over the default value of 300 as we found that it offered sufficiently accurate results for our application while being much faster.</p>
</sec>
<sec>
<title>Model generation</title>
<p>In the model generation step, for each of the response variables, several forests with different number of trees and different number of splits (<italic>t</italic><sub><italic>i</italic></sub>, <italic>m</italic><sub><italic>j</italic></sub>) are tested. In practice, the training set <italic>D</italic><sub><italic>train</italic></sub> is divided into <italic>m</italic><sub><italic>j</italic></sub> disjunct subsets <inline-formula><mml:math id="M7"><mml:msubsup><mml:mrow><mml:mi>D</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>m</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:math></inline-formula> and on each of those, a Random Forest <inline-formula><mml:math id="M8"><mml:msub><mml:mrow><mml:mi>F</mml:mi></mml:mrow><mml:mrow><mml:msubsup><mml:mrow><mml:mi>D</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>m</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:msub></mml:math></inline-formula> is trained on a growing number of <italic>t</italic><sub><italic>i</italic></sub> random trees.</p>
</sec>
<sec>
<title>Model selection</title>
<p>Given a new data point <italic>x</italic>, each model predicts a response variable <italic>y</italic> by averaging the predicted values <inline-formula><mml:math id="M9"><mml:msub><mml:mrow><mml:mi>F</mml:mi></mml:mrow><mml:mrow><mml:msubsup><mml:mrow><mml:mi>D</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi></mml:mrow><mml:mrow><mml:mi>m</mml:mi></mml:mrow></mml:msubsup></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula>, i.e.,</p>
<disp-formula id="E4"><mml:math id="M10"><mml:mtable columnalign="left"><mml:mtr><mml:mtd><mml:mo>&#x00177;</mml:mo><mml:mo>&#x000A0;</mml:mo><mml:mo>=</mml:mo><mml:mo>&#x000A0;</mml:mo><mml:msubsup><mml:mrow><mml:mi>M</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>D</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mo>,</mml:mo><mml:mi>m</mml:mi></mml:mrow></mml:msubsup><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>m</mml:mi></mml:mrow></mml:mfrac><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>k</mml:mi><mml:mo>&#x000A0;</mml:mo><mml:mo>=</mml:mo><mml:mo>&#x000A0;</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>m</mml:mi></mml:mrow></mml:munderover></mml:mstyle><mml:msub><mml:mrow><mml:mi>F</mml:mi></mml:mrow><mml:mrow><mml:msubsup><mml:mrow><mml:mi>D</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mi>r</mml:mi><mml:mi>a</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msubsup></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>Then in a final step an estimate of the root-mean-square (RMSE) generalized error on the test set <italic><bold>D</bold></italic><sub><italic><bold>t</bold>est</italic></sub> is computed, where RSME is defined as</p>
<disp-formula id="E5"><mml:math id="M11"><mml:mtable columnalign="left"><mml:mtr><mml:mtd><mml:mrow><mml:mi>R</mml:mi><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mo>&#x02009;</mml:mo><mml:mo>=</mml:mo><mml:mo>&#x02009;</mml:mo><mml:mstyle displaystyle='true'><mml:munderover><mml:mo>&#x02211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:mrow><mml:msqrt><mml:mrow><mml:msup><mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x02212;</mml:mo><mml:msub><mml:mover accent='true'><mml:mi>y</mml:mi><mml:mo>&#x000AF;</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub></mml:mrow><mml:mo>)</mml:mo></mml:mrow></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:msqrt></mml:mrow></mml:mstyle></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>for <italic><bold>D</bold></italic><sub><italic><bold>t</bold>est</italic></sub>={(x<sub>1</sub>,y<sub>1</sub>),(x<sub>2</sub>,y<sub>2</sub>),&#x02026;,(x<sub>n</sub>,y<sub>n</sub>)}.</p>
<p>Finally, the model with the parameter pair (<italic>t</italic>,<italic>m</italic>) having the minimal error (on the separate test set) is chosen in order to make the predictions.</p>
</sec>
</sec>
<sec>
<title>Data availability</title>
<p>All data used in this paper (including the image and RSML libraries) are available at the address <ext-link ext-link-type="uri" xlink:href="http://doi.org/10.5281/zenodo.208214">http://doi.org/10.5281/zenodo.208214</ext-link></p>
<p>An archived version of the codes used in this paper is available at the address <ext-link ext-link-type="uri" xlink:href="http://doi.org/10.5281/zenodo.208499">http://doi.org/10.5281/zenodo.208499</ext-link></p>
<p>An archived version of the machine learning framework is available at the address <ext-link ext-link-type="uri" xlink:href="https://github.com/FaustFrankenstein/RandomForestFramework/releases/tag/v1.0">https://github.com/FaustFrankenstein/RandomForestFramework/releases/tag/v1.0</ext-link></p>
</sec>
</sec>
<sec id="s3">
<title>Results and discussions</title>
<sec>
<title>Production of a large library of ground-truth root system images</title>
<p>We combined existing tools into a single pipeline to produce a large library of ground-truth root system images. The pipeline combines a root model (ArchiSimple, Pag&#x000E8;s et al., <xref ref-type="bibr" rid="B12">2013</xref>), the Root System Markup Language (RSML) and the RSML Reader plugin from ImageJ (Lobet et al., <xref ref-type="bibr" rid="B10">2015</xref>). In short, ArchiSimple was used to create a large number of root systems, based on random input parameter sets. Each output was stored as an RSML file (Figure <xref ref-type="fig" rid="F2">2A</xref>), which was then used by the RSML Reader plugin to create a graphical representation of the root system (as a. jpeg file) and a ground-truth dataset (Figure <xref ref-type="fig" rid="F2">2B</xref>). Details about the different steps are presented in the Materials and Methods section.</p>
<p>We used the pipeline to create a library of 10,000 root system images, separated into fibrous (multiple first order roots and no secondary growth) and tap-root systems (one first order root and secondary growth). The ranges of the different ground-truth data are shown in Table <xref ref-type="table" rid="T3">3</xref> and their distribution is shown in the Supplemental Figure <xref ref-type="supplementary-material" rid="SM1">1</xref>.</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p><bold>Ranges of the different ground-truth data from the root systems generated using ArchiSimple</bold>.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Variable</bold></th>
<th valign="top" align="center"><bold>Minimum value</bold></th>
<th valign="top" align="center"><bold>Maximum value</bold></th>
<th valign="top" align="left"><bold>Unit</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" colspan="4" style="background-color:#bbbdc0"><bold>FIBROUS</bold></td>
</tr>
<tr>
<td valign="top" align="left">tot_root_length</td>
<td valign="top" align="center">110</td>
<td valign="top" align="center">73971</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">width</td>
<td valign="top" align="center">0.76</td>
<td valign="top" align="center">302</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">depth</td>
<td valign="top" align="center">50</td>
<td valign="top" align="center">505</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">n_1_order</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">20</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">tot_1_order_length</td>
<td valign="top" align="center">79</td>
<td valign="top" align="center">5409</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_1_order_length</td>
<td valign="top" align="center">27</td>
<td valign="top" align="center">470</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_1_order_diameter</td>
<td valign="top" align="center">0.2</td>
<td valign="top" align="center">0.4</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_2&#x0002B;_order_density</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">5</td>
<td valign="top" align="left">root/mm</td>
</tr>
<tr>
<td valign="top" align="left">n_2&#x0002B;_orders</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">4448</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">tot_2&#x0002B;_order_length</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">71556</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_2&#x0002B;_order_length</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">50</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_2&#x0002B;_order_diameter</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0.3</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_2&#x0002B;_order_angle</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">88</td>
<td valign="top" align="left">&#x000B0;</td>
</tr>
<tr>
<td valign="top" align="left" colspan="4" style="background-color:#bbbdc0"><bold>TAP ROOTED</bold></td>
</tr>
<tr>
<td valign="top" align="left">tot_root_length</td>
<td valign="top" align="center">78</td>
<td valign="top" align="center">41870</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">width</td>
<td valign="top" align="center">0.1</td>
<td valign="top" align="center">173</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">depth</td>
<td valign="top" align="center">55</td>
<td valign="top" align="center">505</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">n_1_order</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">tot_1_order_length</td>
<td valign="top" align="center">59</td>
<td valign="top" align="center">509</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_1_order_length</td>
<td valign="top" align="center">59</td>
<td valign="top" align="center">509</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_1_order_diameter</td>
<td valign="top" align="center">0.2</td>
<td valign="top" align="center">16</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_2&#x0002B;_order_density</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">2.3</td>
<td valign="top" align="left">root/mm</td>
</tr>
<tr>
<td valign="top" align="left">n_2&#x0002B;_orders</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">3353</td>
<td valign="top" align="left">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">tot_2&#x0002B;_order_length</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">40225</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_2&#x0002B;_order_length</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">51</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_2&#x0002B;_order_diameter</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">2.2</td>
<td valign="top" align="left">mm</td>
</tr>
<tr>
<td valign="top" align="left">mean_2&#x0002B;_order_angle</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">97</td>
<td valign="top" align="left">&#x000B0;</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>We started by evaluating whether fibrous and tap-root systems should be separated during the analysis. We performed a Principal Component Analysis on the ground-truth dataset to reduce its dimensionality and assess if the <italic>type</italic> grouping influenced the overall dataset structure (Figure <xref ref-type="fig" rid="F3">3A</xref>). Fibrous and tap-root systems formed distinct groups (MANOVA <italic>p</italic> &#x0003C; 0.001), with limited overlap. The first principal component, which represented 30.9% of the variation within the dataset, was mostly influenced by the number of first-order axes. The second principal component (19.1% of the variation) was influenced, in part, by the root diameters. These two effects were consistent with the clear root system type grouping, since they expressed the main difference between the two groups of root-system <italic>types</italic>. Therefore, since the <italic>type</italic> grouping had such a strong effect on the overall structure, we decided to separate them for the following analyses.</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p><bold>(A)</bold> Principal Component Analysis of the root ground-truth dataset. Images of the selected root systems have been added for illustration. <bold>(B)</bold> Loadings of the Principal Component Analysis.</p></caption>
<graphic xlink:href="fpls-08-00447-g0003.tif"/>
</fig>
<p>To demonstrate the utility of a synthetic library of ground-truth root systems, we analyzed every image of the library using a custom-built root image analysis tool, RIA-J. We decided to do so since our purpose was to test the usefulness of the synthetic analysis and not to assess the accuracy of existing tools. Nonetheless, RIA-J was designed using known and published algorithms, often used in root system quantification. A detailed description of RIA-J can be found in the Materials and Methods section and Supplemental File <xref ref-type="supplementary-material" rid="SM1">1</xref>.</p>
<p>We extracted 10 descriptors from each root system image (Table <xref ref-type="table" rid="T2">2</xref>) and compared them with the ground-truth data. For each pair of descriptor-data, we performed a linear regression and computed its r-squared value. Different types of information are highlighted in Figure <xref ref-type="fig" rid="F4">4</xref>. First, using a ground-truth image library allows for a quick and systematic analysis of all the descriptors extracted by the image analysis pipeline. Second, it allows researchers to identify which traits can be accurately evaluated (or not) and by which descriptors. Third, for some ground-truth data, such as the mean length of second order roots or the number of first order roots, it shows that none of the classical descriptors gave a good estimation (Figure <xref ref-type="fig" rid="F4">4</xref>, highlighted with arrows). Finally, the figure highlights that some correlations were different for fibrous- and tap-root systems. As an example, the correlation found between the <italic>mean_2</italic>&#x0002B;<italic>_order_diameter</italic> and <italic>diam_mean</italic> estimators was better for fibrous roots than within the tap-root dataset. Consequently, validation of the different image analysis algorithms should be performed, at least, for each group. An algorithm giving good results for a fibrous root system might fail when applied to tap-rooted ones.</p>
<fig id="F4" position="float">
<label>Figure 4</label>
<caption><p><bold>Heatmap of the r-squared values between the different image descriptors and the ground-truth values, for the images without any noise</bold>. Black represents an r-squared value of 1; white represents a value of 0. Upper panel: fibrous root dataset. Lower panel: tap-root dataset. Arrows highlight the ground-truth data that cannot be accurately described with the different descriptors. The arrows were doubled when it was the case for both fibrous and tap-rooted root systems.</p></caption>
<graphic xlink:href="fpls-08-00447-g0004.tif"/>
</fig>
</sec>
<sec>
<title>Errors from image descriptors are likely to be non-linear across root system sizes and image qualities</title>
<p>In addition to being related to the species of study, estimation errors are likely to increase with the root system size. As the root system grows and develops, the number of crossing and overlapping segments increases (Figure <xref ref-type="fig" rid="F5">5A</xref>), making the subsequent image analysis potentially more difficult and prone to error. However, a systematic analysis of such error is seldom performed.</p>
<fig id="F5" position="float">
<label>Figure 5</label>
<caption><p><bold>Error estimation for three ground-truth parameters</bold>. <bold>(A)</bold> Evolution of the overlap index (proportion of root overlapping) with the root system size. <bold>(B&#x02013;D)</bold> Left panel shows the relationship between the descriptors and the corresponding ground-truth variables. Right panels show the evolution of the Mean Relative Error (MRE) as a function of the overlap index. For the MRE calculations, the continuous variables were discretized in groups. <bold>(B)</bold> Number of lateral roots. <bold>(C)</bold> Total root length. <bold>(D)</bold> Root system depth. In the left panels, the gray line indicates the diagonal (1:1 relation).</p></caption>
<graphic xlink:href="fpls-08-00447-g0005.tif"/>
</fig>
<p>Estimation errors are also likely to increase as the image quality decreases. Here we artificially added one type of noise (random &#x0201C;salt and pepper&#x0201D; particles) to the images, with two intensity levels. It should be noted that virtually any type of image degradation could be added to the original images using custom image filters (e.g., using ImageJ). Different types of degradation are expected to generate different levels of estimation errors.</p>
<p>Figure <xref ref-type="fig" rid="F5">5</xref> shows the relationship between the ground-truth and descriptor values for three parameters: the total root length (Figure <xref ref-type="fig" rid="F5">5B</xref>), the number of roots (Figure <xref ref-type="fig" rid="F5">5C</xref>), and the root system depth (Figure <xref ref-type="fig" rid="F5">5D</xref>). For each of these variables, we quantified the Mean Relative Error (see Materials and Methods for details) as a function of the overlap index. This was done for three levels of noise added to the images (&#x0201C;null,&#x0201D; &#x0201C;medium,&#x0201D; and &#x0201C;high&#x0201D;). We can observe that for the estimation of both the total root length and the number of lateral roots, the Mean Relative Error increased with the size of the root system (Figures <xref ref-type="fig" rid="F5">5B&#x02013;C</xref>). As stated above, such increase of the error was somehow expected with increasing complexity. Moreover, depending on the metric of interest, such as the number of root tips, low image quality can result in high level of error. For other traits, such as the root system depth, no errors were expected (<italic>depth</italic> is supposedly an error-less variable) and the Mean Relative Error was close to 0 whatever the size of the root system and image quality.</p>
<p>The results presented here are tightly dependent on the specific algorithms used for image analysis and hence might be different for other published tools. However, they are a call for caution when analyzing root images: unexpected errors in ground-truth estimation can arise. Our image library can be used to better identify the errors generated by other analysis tools, current or future.</p>
</sec>
<sec>
<title>Roadmap for root image analysis tools calibration</title>
<p>To improve the calibration and validation of future root image analysis tools, we propose the following procedure:
<list list-type="order">
<list-item><p>Develop the new root image analysis pipeline;</p></list-item>
<list-item><p>Use it to analyse the images from the synthetic root library described here;</p></list-item>
<list-item><p>Compare the results from the new analysis with the corresponding ground-truth;</p></list-item>
<list-item><p>Identify, and clearly state, the type of root systems for which the pipeline works accurately;</p></list-item>
<list-item><p>When releasing the new pipeline, inform the users about the possible errors identified.</p></list-item>
</list></p>
</sec>
<sec>
<title>Using the synthetic library to train machine learning algorithms</title>
<p>The main advantage of creating a synthetic library is to generate paired datasets of image descriptors and their corresponding ground-truth values. Having information on both can, in theory, be used to either calibrate the image analysis pipeline or to identify the best descriptors for the ground-truth traits of interest. Here, we explored the second approach and used a Random Forest algorithm to find which combination of descriptors would best describe each ground-truth data (see Material and Methods for details). In short, we randomly divided the whole dataset into training (3/4) and testing subsets (1/4). The training set was used to create a Random Forest model for each ground-truth data, which was then we applied to the test set. The accuracy of these new predictions was then compared to the accuracy of the direct method (single descriptors) (Figure <xref ref-type="fig" rid="F2">2C</xref>).</p>
<p>Figure <xref ref-type="fig" rid="F6">6</xref> shows the comparison of the accuracy (both the r-squared values from linear regressions and the Mean Relative Error, MRE) of both methods for each ground-truth data. We can clearly see that the Random Forest approach performed always better (sometimes substantially) than the direct approach, even for images with high level of noise. In addition, for most traits, the r-squared and MRE values were above 0.9 and below 0.1 respectively, which is very good, especially for such a wide range of images. In addition, the Random Forest approach allowed the correct estimation of traits that were difficult to estimate with the direct approach (such as the number of first-order axes or the mean second-order root density).</p>
<fig id="F6" position="float">
<label>Figure 6</label>
<caption><p><bold>Comparison between the direct trait and the Random Forest approach, for the different root system types and the different levels of noise</bold>. For each metric, we computed both the r-squared value from the linear regression between the estimation and the ground-truth (left panels), as well as the Mean Relative Error (right panel). The gray points represent the values obtained with the direct estimation (best descriptor, no noise). Color points represent the values obtained with the Random Forest approach, for different levels of noise. The dotted lines show the 0.9 (r-squared) and 0.1(MRE) thresholds.</p></caption>
<graphic xlink:href="fpls-08-00447-g0006.tif"/>
</fig>
<p>Figure <xref ref-type="fig" rid="F7">7</xref> shows the detailed comparison of both methods for the estimation of the total root length. Again, a clear improvement was visible with the Random Forest method, leading to small errors, even with large root systems and noisy images.</p>
<fig id="F7" position="float">
<label>Figure 7</label>
<caption><p><bold>Comparison between the direct trait estimation and the Random Forest approach, for the different root system types and the different levels of noise</bold>. <bold>(A)</bold> Comparison, for the total root length, of the accuracy of both approaches. The dotted line represents the diagonal. The plain line represents the linear regression. <bold>(B)</bold> Same, for the number of roots.</p></caption>
<graphic xlink:href="fpls-08-00447-g0007.tif"/>
</fig>
<p>Here we presented how machine learning algorithms (Random Forest), could be used in combination with a synthetic image library to improve the estimation of root system traits. Although both the training and test datasets used were made of synthetic images, we believe this approach presents an interesting perspective for the analysis of experimental images.</p>
<p>Indeed, a root architectural model can be used to build a custom library of synthetic images from a set of parameters evaluated on a small number of plants from the experimental dataset. Such library could then be used to train the machine learning model which, in turn, will enable the automatic evaluation of root traits from the remaining experimental images. Alternatively, the algorithm could be directly trained on a subset of experimental data obtained by manual or semi-automatic analyses to be then automatically applied to the rest of the dataset. One must keep in mind that the output of the machine learning strongly depends upon the quality of the dataset used for its training and hence must be analyzed carefully.</p>
</sec>
</sec>
<sec sec-type="conclusions" id="s4">
<title>Conclusions</title>
<p>The automated analysis of root system images is routinely performed in many research projects. Here we used a library of 10,000 synthetic images to estimate the accuracy and usefulness of different image descriptors extracted with a homemade root image analysis pipeline. Our study highlighted some limitations and biases of the image analysis process.</p>
<p>We found that the type of root system (fibrous vs. tap-rooted), its size and complexity, as well as the quality of the images had a strong influence on the accuracy of some commonly used image descriptors and their meaning and relevance for ground-truth extraction. So far, a large proportion of the root research has been focused on seedlings with small root systems and has <italic>de facto</italic> avoided such errors.</p>
<p>However, as the research questions are likely to focus more on mature root systems in the future, these limitations will become critical. We showed that synthetic datasets can be used for calibration or modeling (machine learning) steps that allow ground-truth extraction from comparable images. We then hope that our library will be helpful for the root research community to evaluate and improve other image analysis pipelines.</p>
</sec>
<sec id="s5">
<title>Author contributions</title>
<p>GL, LP, PT, IK, MN, and CP designed the study. IK developed the image analysis pipeline RIA-J. MN and PM developed the Random Forest framework. GL generated the image library and did the data analysis. LP developed the Archisimple model. All authors have participated in the writing of the manuscript.</p>
</sec>
<sec id="s6">
<title>Funding</title>
<p>This research was funded by the Interuniversity Attraction Poles Programme initiated by the Belgian Science Policy Office, P7/29. GL and MN are grateful to the F.R.S.-FNRS for a postdoctoral research grant (1.B.237.15F) and doctoral grant (1.A.320.16F), respectively.</p>
<sec>
<title>Conflict of interest statement</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</sec>
</body>
<back>
<sec sec-type="supplementary-material" id="s7">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="http://journal.frontiersin.org/article/10.3389/fpls.2017.00447/full#supplementary-material">http://journal.frontiersin.org/article/10.3389/fpls.2017.00447/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Image1.TIFF" id="SM1" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplemental Figure 1</label>
<caption><p><bold>Distribution of the properties of the modeled root images</bold>.</p></caption></supplementary-material>
<supplementary-material xlink:href="Image2.TIFF" id="SM2" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplemental Figure 2</label>
<caption><p><bold>Distribution of the descriptors of the modeled root images</bold>.</p></caption></supplementary-material>
<supplementary-material xlink:href="DataSheet1.PDF" id="SM3" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplemental File 1</label>
<caption><p><bold>Definitions of the different descriptors extracted by RIA-J</bold>.</p></caption></supplementary-material>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Armengaud</surname> <given-names>P.</given-names></name> <name><surname>Zambaux</surname> <given-names>P.</given-names></name> <name><surname>Hills</surname> <given-names>A.</given-names></name> <name><surname>Sulpice</surname> <given-names>R.</given-names></name> <name><surname>Pattison</surname> <given-names>R. J.</given-names></name> <name><surname>Blatt</surname> <given-names>M. R.</given-names></name> <etal/></person-group>. (<year>2009</year>). <article-title>EZ-Rhizo: integrated software for the fast and accurate measurement of root system architecture</article-title>. <source>Plant J.</source> <volume>57</volume>, <fpage>945</fpage>&#x02013;<lpage>956</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-313X.2008.03739.x</pub-id><pub-id pub-id-type="pmid">19000163</pub-id></citation>
</ref>
<ref id="B2">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Benoit</surname> <given-names>L.</given-names></name> <name><surname>Rousseau</surname> <given-names>D.</given-names></name> <name><surname>Belin</surname> <given-names>&#x000C9;.</given-names></name> <name><surname>Demilly</surname> <given-names>D.</given-names></name> <name><surname>Chapeau-Blondeau</surname> <given-names>F.</given-names></name></person-group> (<year>2014</year>). <article-title>Simulation of image acquisition in machine vision dedicated to seedling elongation to validate image processing root segmentation algorithms</article-title>. <source>Comput. Electron. Agric.</source> <volume>104</volume>, <fpage>84</fpage>&#x02013;<lpage>92</lpage>. <pub-id pub-id-type="doi">10.1016/j.compag.2014.04.001</pub-id></citation>
</ref>
<ref id="B3">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Breiman</surname> <given-names>L.</given-names></name></person-group> (<year>1996</year>). <article-title>Bagging predictors</article-title>. <source>Mach. Learn.</source> <volume>24</volume>, <fpage>123</fpage>&#x02013;<lpage>140</lpage>. <pub-id pub-id-type="doi">10.1007/BF00058655</pub-id></citation>
</ref>
<ref id="B4">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Breiman</surname> <given-names>L.</given-names></name></person-group> (<year>2001</year>). <article-title>Random Forests</article-title>. <source>Mach. Learn.</source> <volume>45</volume>, <fpage>5</fpage>&#x02013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id></citation>
</ref>
<ref id="B5">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bucksch</surname> <given-names>A.</given-names></name> <name><surname>Burridge</surname> <given-names>J.</given-names></name> <name><surname>York</surname> <given-names>L. M.</given-names></name> <name><surname>Das</surname> <given-names>A.</given-names></name> <name><surname>Nord</surname> <given-names>E.</given-names></name> <name><surname>Weitz</surname> <given-names>J. S.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Image-based high-throughput field phenotyping of crop roots</article-title>. <source>Plant Physiol</source>. <volume>166</volume>, <fpage>470</fpage>&#x02013;<lpage>486</lpage>. <pub-id pub-id-type="doi">10.1104/pp.114.243519</pub-id><pub-id pub-id-type="pmid">25187526</pub-id></citation>
</ref>
<ref id="B6">
<citation citation-type="web"><person-group person-group-type="author"><collab>CRAN randomForest</collab></person-group> (<year>2015</year>). Available online at: <ext-link ext-link-type="uri" xlink:href="https://cran.r-project.org/web/packages/randomForest/randomForest.pdf">https://cran.r-project.org/web/packages/randomForest/randomForest.pdf</ext-link></citation>
</ref>
<ref id="B7">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Galkovskyi</surname> <given-names>T.</given-names></name> <name><surname>Mileyko</surname> <given-names>Y.</given-names></name> <name><surname>Bucksch</surname> <given-names>A.</given-names></name> <name><surname>Moore</surname> <given-names>B.</given-names></name> <name><surname>Symonova</surname> <given-names>O.</given-names></name> <name><surname>Price</surname> <given-names>C. A.</given-names></name> <etal/></person-group>. (<year>2012</year>). <article-title>GiA Roots: software for the high throughput analysis of plant root system architecture</article-title>. <source>BMC Plant Biol.</source> <volume>12</volume>:<fpage>116</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2229-12-116</pub-id><pub-id pub-id-type="pmid">22834569</pub-id></citation>
</ref>
<ref id="B8">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Huynh-Thu</surname> <given-names>V. A.</given-names></name> <name><surname>Wehenkel</surname> <given-names>L.</given-names></name> <name><surname>Geurts</surname> <given-names>P.</given-names></name></person-group> (<year>2013</year>). <source>Gene Regulatory Network Inference from Systems Genetics Data Using Tree-Based Methods</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>.</citation>
</ref>
<ref id="B9">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Koevoets</surname> <given-names>I. T.</given-names></name> <name><surname>Venema</surname> <given-names>J. H.</given-names></name> <name><surname>Elzenga</surname> <given-names>J. T.</given-names></name> <name><surname>Testerink</surname> <given-names>C.</given-names></name></person-group> (<year>2016</year>). <article-title>Roots withstanding their environment: exploiting root system architecture responses to abiotic stress to improve crop tolerance</article-title>. <source>Front. Plant Sci.</source> <volume>7</volume>:<fpage>1335</fpage>. <pub-id pub-id-type="doi">10.3389/fpls.2016.01335</pub-id><pub-id pub-id-type="pmid">27630659</pub-id></citation>
</ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lobet</surname> <given-names>G.</given-names></name> <name><surname>Pound</surname> <given-names>M. P.</given-names></name> <name><surname>Diener</surname> <given-names>J.</given-names></name> <name><surname>Pradal</surname> <given-names>C.</given-names></name> <name><surname>Draye</surname> <given-names>X.</given-names></name> <name><surname>Godin</surname> <given-names>C.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Root system markup language: toward a unified root architecture description language</article-title>. <source>Plant Physiol.</source> <volume>167</volume>, <fpage>617</fpage>&#x02013;<lpage>627</lpage>. <pub-id pub-id-type="doi">10.1104/pp.114.253625</pub-id><pub-id pub-id-type="pmid">25614065</pub-id></citation>
</ref>
<ref id="B11">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mar&#x000E9;e</surname> <given-names>R.</given-names></name> <name><surname>Geurts</surname> <given-names>P.</given-names></name> <name><surname>Wehenkel</surname> <given-names>L.</given-names></name></person-group> (<year>2016</year>). <article-title>Towards generic image classification using tree-based learning: an extensive empirical study</article-title>. <source>Pattern Recognit. Lett.</source> <volume>74</volume>, <fpage>17</fpage>&#x02013;<lpage>23</lpage>. <pub-id pub-id-type="doi">10.1016/j.patrec.2016.01.006</pub-id></citation>
</ref>
<ref id="B12">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pag&#x000E8;s</surname> <given-names>L.</given-names></name> <name><surname>B&#x000E9;cel</surname> <given-names>C.</given-names></name> <name><surname>Boukcim</surname> <given-names>H.</given-names></name> <name><surname>Moreau</surname> <given-names>D.</given-names></name> <name><surname>Nguyen</surname> <given-names>C.</given-names></name> <name><surname>Voisin</surname> <given-names>A.-S.</given-names></name></person-group> (<year>2013</year>). <article-title>Calibration and evaluation of ArchiSimple, a simple model of root system architecture</article-title>. <source>Ecol. Modell.</source> <volume>290</volume>, <fpage>76</fpage>&#x02013;<lpage>84</lpage>. <pub-id pub-id-type="doi">10.1016/j.ecolmodel.2013.11.014</pub-id></citation>
</ref>
<ref id="B13">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pag&#x000E8;s</surname> <given-names>L.</given-names></name> <name><surname>Jordan</surname> <given-names>M. O.</given-names></name> <name><surname>Picard</surname> <given-names>D.</given-names></name></person-group> (<year>1989</year>). <article-title>A simulation model of the three-dimensional architecture of the maize root system</article-title>. <source>Plant Soil</source> <volume>119</volume>, <fpage>147</fpage>&#x02013;<lpage>154</lpage>. <pub-id pub-id-type="doi">10.1007/BF02370279</pub-id></citation>
</ref>
<ref id="B14">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pag&#x000E8;s</surname> <given-names>L.</given-names></name> <name><surname>Pellerin</surname> <given-names>S.</given-names></name></person-group> (<year>1996</year>). <article-title>Study of differences between vertical root maps observed in a maize crop and simulated maps obtained using a model for the three-dimensional architecture of the root system</article-title>. <source>Plant Soil</source> <volume>182</volume>, <fpage>329</fpage>&#x02013;<lpage>337</lpage>. <pub-id pub-id-type="doi">10.1007/BF00029063</pub-id></citation>
</ref>
<ref id="B15">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pag&#x000E8;s</surname> <given-names>L.</given-names></name> <name><surname>Vercambre</surname> <given-names>G.</given-names></name> <name><surname>Drouet</surname> <given-names>J.-L.</given-names></name> <name><surname>Lecompte</surname> <given-names>F.</given-names></name> <name><surname>Collet</surname> <given-names>C.</given-names></name> <name><surname>LeBot</surname> <given-names>J.</given-names></name></person-group> (<year>2004</year>). <article-title>RootTyp: a generic model to depict and analyze the root system architecture</article-title>. <source>Plant Soil</source> <volume>258</volume>, <fpage>103</fpage>&#x02013;<lpage>119</lpage>. <pub-id pub-id-type="doi">10.1023/B:PLSO.0000016540.47134.03</pub-id></citation>
</ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pierret</surname> <given-names>A.</given-names></name> <name><surname>Gonkhamdee</surname> <given-names>S.</given-names></name> <name><surname>Jourdan</surname> <given-names>C.</given-names></name> <name><surname>Maeght</surname> <given-names>J.-L.</given-names></name></person-group> (<year>2013</year>). <article-title>IJ-Rhizo: an open-source software to measure scanned images of root samples</article-title>. <source>Plant Soil</source> <volume>373</volume>, <fpage>531</fpage>&#x02013;<lpage>539</lpage>. <pub-id pub-id-type="doi">10.1007/s11104-013-1795-9</pub-id></citation>
</ref>
<ref id="B17">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rell&#x000E1;n-&#x000C1;lvarez</surname> <given-names>R.</given-names></name> <name><surname>Lobet</surname> <given-names>G.</given-names></name> <name><surname>Lindner</surname> <given-names>H.</given-names></name> <name><surname>Pradier</surname> <given-names>P.-L.</given-names></name> <name><surname>Sebastian</surname> <given-names>J.</given-names></name> <name><surname>Yee</surname> <given-names>M.-C.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>GLO-Roots: an imaging platform enabling multidimensional characterization of soil-grown root systems</article-title>. <source>Elife</source> <volume>4</volume>:<fpage>e07597</fpage>. <pub-id pub-id-type="doi">10.7554/eLife.07597</pub-id><pub-id pub-id-type="pmid">26287479</pub-id></citation>
</ref>
<ref id="B18">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Sarkar</surname> <given-names>D.</given-names></name></person-group> (<year>2008</year>). <source>Lattice: Multivariate Data Visualization with R</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>.</citation>
</ref>
<ref id="B19">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Wickham</surname> <given-names>H.</given-names></name></person-group> (<year>2009</year>). <source>ggplot2</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer New York</publisher-name>.</citation>
</ref>
</ref-list>
<fn-group>
<fn id="fn0001"><p><sup>1</sup>R Core Team R: A Language and Environment for Statistical Computing.</p></fn>
</fn-group>
</back>
</article>