<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Syst. Biol.</journal-id>
<journal-title>Frontiers in Systems Biology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Syst. Biol.</abbrev-journal-title>
<issn pub-type="epub">2674-0702</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">893366</article-id>
<article-id pub-id-type="doi">10.3389/fsysb.2023.893366</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Systems Biology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Clonal abundance patterns in hematopoiesis: Mathematical modeling and parameter estimation</article-title>
<alt-title alt-title-type="left-running-head">Pan et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fsysb.2023.893366">10.3389/fsysb.2023.893366</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Pan</surname>
<given-names>Yunbei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1517168/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>D&#x2019;Orsogna</surname>
<given-names>Maria R.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1376780/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Tang</surname>
<given-names>Min</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1772649/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Stiehl</surname>
<given-names>Thomas</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Chou</surname>
<given-names>Tom</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1315665/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Computational Medicine</institution>, <institution>UCLA</institution>, <addr-line>Los Angeles</addr-line>, <addr-line>CA</addr-line>, <country>United States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Mathematics</institution>, <institution>California State University at Northridge</institution>, <addr-line>Los Angeles</addr-line>, <addr-line>CA</addr-line>, <country>United States</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Institute of Natural Sciences</institution>, <institution>Shanghai Jiaotong University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Institute of Computational Biomedicine</institution>, <institution>RWTH Aachen University</institution>, <addr-line>Aachen</addr-line>, <country>Germany</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Department of Mathematics</institution>, <institution>UCLA</institution>, <addr-line>Los Angeles</addr-line>, <addr-line>CA</addr-line>, <country>United States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/115285/overview">Jayajit Das</ext-link>, The Ohio State University, United States</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/307667/overview">Steven M. Abel</ext-link>, The University of Tennessee, United States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1730471/overview">Wenjie Sun</ext-link>, Institute Curie, France</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Maria R. D&#x2019;Orsogna, <email>dorsogna@csun.edu</email>; Min Tang, <email>tangmin@sjtu.edu.cn</email>; Tom Chou, <email>tomchou@ucla.edu</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Integrative Systems Immunology, a section of the journal Frontiers in Systems Biology</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>09</day>
<month>02</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>3</volume>
<elocation-id>893366</elocation-id>
<history>
<date date-type="received">
<day>10</day>
<month>03</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>09</day>
<month>01</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Pan, D&#x2019;Orsogna, Tang, Stiehl and Chou.</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Pan, D&#x2019;Orsogna, Tang, Stiehl and Chou</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Hematopoiesis has been studied <italic>via</italic> stem cell labeling using barcodes, viral integration sites (VISs), or <italic>in situ</italic> methods. Subsequent proliferation and differentiation preserve the tag identity, thus defining a clone of mature cells across multiple cell type or lineages. By tracking the population of clones, measured within samples taken at discrete time points, we infer physiological parameters associated with a hybrid stochastic-deterministic mathematical model of hematopoiesis. We analyze clone population data from Koelle et al. (<xref ref-type="bibr" rid="B28">Koelle et al., 2017</xref>) and compare the states of clones (mean and variance of their abundances) and the state-space density of clones with the corresponding quantities predicted from our model. Comparing our model to the tagged granulocyte populations, we find parameters (stem cell carrying capacity, stem cell differentiation rates, and the proliferative potential of progenitor cells, and sample sizes) that provide reasonable fits in three out of four animals. Even though some observed features cannot be quantitatively reproduced by our model, our analyses provides insight into how model parameters influence the underlying mechanisms in hematopoiesis. We discuss additional mechanisms not incorporated in our model.</p>
</abstract>
<kwd-group>
<kwd>stem cells</kwd>
<kwd>hematopoiesis</kwd>
<kwd>barcodes</kwd>
<kwd>clonal tracking</kwd>
<kwd>differentiation</kwd>
</kwd-group>
<contract-num rid="cn001">R01HL146552</contract-num>
<contract-num rid="cn002">W911NF-18-1-0345</contract-num>
<contract-num rid="cn003">DMS-1814090</contract-num>
<contract-sponsor id="cn001">Office of Extramural Research, National Institutes of Health<named-content content-type="fundref-id">10.13039/100006955</named-content>
</contract-sponsor>
<contract-sponsor id="cn002">Army Research Office<named-content content-type="fundref-id">10.13039/100000183</named-content>
</contract-sponsor>
<contract-sponsor id="cn003">National Science Foundation<named-content content-type="fundref-id">10.13039/100000001</named-content>
</contract-sponsor>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>Hematopoiesis, the process by which hematopoietic stem cells (HSCs) generate all mature blood cells in an animal through proliferation and differentiation plays a crucial role in an organism&#x2019;s immune response and maintaining overall homeostasis. Estimates of the number of actively cycling HSC range from 50000&#x2013;200000 in humans (<xref ref-type="bibr" rid="B30">Lee-Six et al., 2018</xref>) and approximately 5,000 in mice (<xref ref-type="bibr" rid="B6">Busch et al., 2015</xref>; <xref ref-type="bibr" rid="B35">Mayle et al., 2015</xref>). It is well-known that these small numbers of hematopoietic stem cells can generate 10<sup>10</sup>&#x2013;10<sup>12</sup> cells of multiple cell types daily, over an organism&#x2019;s lifetime (<xref ref-type="bibr" rid="B19">Fliedner, 2002</xref>; <xref ref-type="bibr" rid="B17">Doulatov et al., 2012</xref>). Understanding the mechanisms of hematopoiesis can help guide clinical treatment, especially those related to bone marrow transplantation and in the context of blood cancers (<xref ref-type="bibr" rid="B36">Mendelson and Frenette, 2014</xref>; <xref ref-type="bibr" rid="B6">Busch et al., 2015</xref>; <xref ref-type="bibr" rid="B22">Goyal et al., 2015</xref>).</p>
<p>HSCs are often quiescent (<xref ref-type="bibr" rid="B43">Seita and Weissman, 2010</xref>), making them hard to track <italic>in vivo</italic> and difficult to control <italic>in vitro</italic>. Thus, the HSC dynamics <italic>in vivo</italic> can only be straightforwardly interrogated through analysis of populations of more downstream progenitors and differentiated blood cells (<xref ref-type="bibr" rid="B7">Bystrykh et al., 2012</xref>). One way to quantitatively probe the hematopoiesis process is the labeling of multipotent HSCs by tagging their genomes. The tags can take the form of viral integration sites or barcodes (<xref ref-type="bibr" rid="B23">Grosselin et al., 2013</xref>; <xref ref-type="bibr" rid="B25">Kim et al., 2014</xref>; <xref ref-type="bibr" rid="B52">Wu et al., 2014</xref>; <xref ref-type="bibr" rid="B4">Biasco et al., 2016</xref>; <xref ref-type="bibr" rid="B28">Koelle et al., 2017</xref>). In a typical <italic>in vivo</italic> experiment, CD34<sup>&#x2b;</sup> stem cells are extracted, tagged, and then autologously transplanted back into the animal, typically a mouse or a rhesus macaque. CD34<sup>&#x2b;</sup> cells contain HSCs as well as early hematopoietic stem and progenitor cells (HSPCs), with a wide range of estimated relative proportions (<xref ref-type="bibr" rid="B14">Corso et al., 2005</xref>; <xref ref-type="bibr" rid="B3">Attar, 2014</xref>; <xref ref-type="bibr" rid="B38">Parmentier et al., 2020</xref>). The downstream progenitor and mature cells that derive from proliferation of HSCs of a particular tag will form a clone of cells that share the same tag. Clonal tracking of cell tags is thus a powerful tool for interrogating the differentiation process during hematopoiesis (<xref ref-type="bibr" rid="B33">Lyne et al., 2018</xref>; <xref ref-type="bibr" rid="B9">Challen and Goodell, 2020</xref>; <xref ref-type="bibr" rid="B13">Cordes et al., 2021</xref>). For example, the abundances of the different tags that appear in the different types of mature cells can shed light on the branching structure of differentiation and on proliferation dynamics, particularly when coupled with mathematical models and/or simulations (<xref ref-type="bibr" rid="B46">Stiehl and Marciniak-Czochra, 2011</xref>; <xref ref-type="bibr" rid="B48">Sun and Komarova, 2012</xref>; <xref ref-type="bibr" rid="B49">Sz&#xe9;kely et al., 2014</xref>; <xref ref-type="bibr" rid="B24">H&#xf6;fer and Rodewald, 2016</xref>; <xref ref-type="bibr" rid="B53">Xu J. et al., 2018</xref>).</p>
<p>Clonal tracking in mice (<xref ref-type="bibr" rid="B12">Copley et al., 2012</xref>; <xref ref-type="bibr" rid="B47">Sun et al., 2014</xref>) has revealed the timescales of repopulation dynamics under homeostasis and after bone marrow transplantation (<xref ref-type="bibr" rid="B37">Muller-Sieburg et al., 2012</xref>; <xref ref-type="bibr" rid="B50">Verovskaya et al., 2013</xref>; <xref ref-type="bibr" rid="B6">Busch et al., 2015</xref>), but typically involves very few clones that cover only a small fraction of the HSC population. To transplant many HSC clones in order to see patterns of how clones are distributed during hematopoiesis requires experiments on animals larger than mice.</p>
<p>Transplant experiments in rhesus macaque on the other hand allow for hundreds or thousands of clones to be engrafted into an organism that exhibits population levels and timescales closer to those in humans. One experiment in rhesus macaque involved tracking HSC clonal dynamics of lentivirus-tagged HSCs and early progenitor cells (HSPCs), and following hematopoiesis over a time period comparable to the animal&#x2019;s life-span (<xref ref-type="bibr" rid="B26">Kim et al., 2010</xref>, <xref ref-type="bibr" rid="B25">2014</xref>). Here, CD34<sup>&#x2b;</sup> HSPCs from the bone marrow, which include various progenitor cells, were marked <italic>via</italic> the integration of a lentivirus vector with an accompanying green fluorescent protein (GFP) tag at random viral integration sites (VISs). After sublethal myeloablative irradiation to eliminate a substantial number of cells in the bone marrow, the tagged HSPCs were autologously transplanted. If these cells divide and differentiate after transplantation, their progeny will inherit the unique VISs. Sampling and sequencing of these mature cells indicates which ones are descendants of a founder HSC. Data collected from four macaques over 14&#xa0;years were analyzed showing how bias towards the lymphoid or myeloid differentiation branches changes over time. More detailed analyses were also performed in order to connect clonal patterns during hematopoiesis with a mathematical model that describes how self-renewal, differentiation, and subsampling of a multiclone population affects clone abundances and their fluctuations across time (<xref ref-type="bibr" rid="B22">Goyal et al., 2015</xref>; <xref ref-type="bibr" rid="B55">Xu S. et al., 2018</xref>). By fitting a simple mechanistic model to abundances of hundreds to thousands of clones, random initial differentiation events that each led to a subsequent burst of mature cells was proposed as a mechanism to explain observed population fluctuations. The number of generations <italic>L</italic> that progenitor cells traverse along a differentiation pathway (lineage) before terminal differentiation was also estimated to be <italic>L</italic> &#x223c; 24 for the granulocyte lineage (<xref ref-type="bibr" rid="B55">Xu S. et al., 2018</xref>). To obtain this result, a mean-field model for HSC self-renewal was developed and applied to experimental data on granulocytes, using only the mean and variance of clone populations in the data fitting.</p>
<p>In this paper, we improve on the model used in (<xref ref-type="bibr" rid="B55">Xu S. et al., 2018</xref>) by developing a framework that can explain population transients and that can predict the density of the number of clones with respect to mean clone sizes. Instead of analyzing VIS data from (<xref ref-type="bibr" rid="B26">Kim et al., 2010</xref>, <xref ref-type="bibr" rid="B25">2014</xref>), we consider the barcode data from (<xref ref-type="bibr" rid="B52">Wu et al., 2014</xref>; <xref ref-type="bibr" rid="B28">Koelle et al., 2017</xref>). In the latter experimental studies, replication-incompetent HIV-derived lentiviral barcoding vectors were used to tag HSCs that were transplanted into four rhesus macaques. The barcode consists of a six base-pair library identification and a 35 base pair high-diversity cellular barcode. As with the VIS experiments, barcoded cells were reinfused in the animals after myeloablative total-body irradiation. Purified samples of blood cells were then subject to low-cycle PCR amplification with the two primers bracketing the barcode. This barcoding approach provides more precise quantification relative to other clonal tracking protocols such as VIS (<xref ref-type="bibr" rid="B25">Kim et al., 2014</xref>) and transposon tagging (<xref ref-type="bibr" rid="B47">Sun et al., 2014</xref>) approaches. Thus, we will analyze the barcoding data <italic>via</italic> a mathematical model with the goal of more accurately estimating physiological parameters such as HSC carrying capacity, progenitor cell division rates, and progenitor cell proliferative potential for the granulocyte cell lineage. Although clonal structure of mature cells of different lineages, such as T, B, monocytes, and NK cells, were quantified in (<xref ref-type="bibr" rid="B52">Wu et al., 2014</xref>; <xref ref-type="bibr" rid="B28">Koelle et al., 2017</xref>), lymphocyte maturation is more complex, involving additional intermediate steps and subsequent immune signaling and mature cell proliferation. Thus, we focus on the simpler and abundant mature granulocyte population (<xref ref-type="bibr" rid="B7">Bystrykh et al., 2012</xref>).</p>
<p>In the following Materials and Methods section, we briefly describe the raw data and present the mathematical model. In the Data Analysis and Results section, we describe how measured clone data is compared to predicted clone abundances and show that minimization of the difference leads to reasonable estimates of parameter estimates. Finally, in the Discussion and Conclusions, we provide qualitative insight into how model parameters affect the predicted clonal patterns and discuss further improvements and potential new modeling directions.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>Materials and methods</title>
<p>In this section, we describe information extracted from the granulocyte abundance data in (<xref ref-type="bibr" rid="B28">Koelle et al., 2017</xref>) and the mathematical model used to describe this data. The experimental parameters associated with the experiments are listed in <xref ref-type="table" rid="T1">Table 1</xref>, which lists the number of cells (tagged and untagged) transplanted, the barcode library size used, and the total number of different barcodes observed across all samples of all lineages for each animal. These values inform us on the typical magnitude of experimental parameters to which our subsequent model must conform. In <xref ref-type="table" rid="T2">Table 2</xref>, we list parameters used in our mathematical model as determined either from experimental data or through estimates.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Transplant parameters. The initial transplant populations for the four animals ZH33, ZG66, ZH19, and ZJ31. The total library size for the cell preparation was in the range <italic>C</italic>
<sub>
<italic>L</italic>
</sub> &#x3d; 53319 &#x2212; 109085. The total number of cells injected was <italic>H</italic> &#x3d; 2.3 &#xd7; 10<sup>7</sup> &#x2212; 4.8 &#xd7; 10<sup>7</sup>, of which <italic>H</italic>&#x2a; &#x3d; 8.0 &#xd7; 10<sup>6</sup> &#x2212; 1.67 &#xd7; 10<sup>7</sup> were barcoded (corresponding to 23%&#x2013;35% GFP&#x2b; labeling). Across all peripheral blood samples and cell lineages, the total number of barcodes detected in each animal was in the range <inline-formula id="inf1">
<mml:math id="m1">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>21450</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>62354</mml:mn>
</mml:math>
</inline-formula>, <italic>i.e.</italic>, roughly half of injected HSC barcodes were detected in the peripheral blood samples. Among granulocytes, the total sampled richness (across all time points) ranged from 2660 &#x2212; 32363.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Variable Animal</th>
<th align="center">Library size <italic>C</italic>
<sub>
<italic>L</italic>
</sub>
</th>
<th align="center">Injected cells <italic>H</italic>
</th>
<th align="center">Injected GFP&#x2b; <italic>H</italic>&#x2a;</th>
<th align="center">Total <italic>C</italic>
<sub>s</sub>
</th>
<th align="center">
<italic>C</italic>
<sub>s</sub> (grans)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">ZH33</td>
<td align="center">63469</td>
<td align="center">3.2 &#xd7; 10<sup>7</sup>
</td>
<td align="center">1.11 &#xd7; 10<sup>7</sup>
</td>
<td align="center">25325</td>
<td align="center">9221</td>
</tr>
<tr>
<td align="left">ZG66</td>
<td align="center">53613</td>
<td align="center">4.8 &#xd7; 10<sup>7</sup>
</td>
<td align="center">1.67 &#xd7; 10<sup>7</sup>
</td>
<td align="center">21450</td>
<td align="center">2660</td>
</tr>
<tr>
<td align="left">ZH19</td>
<td align="center">53319</td>
<td align="center">4.8 &#xd7; 10<sup>7</sup>
</td>
<td align="center">1.1 &#xd7; 10<sup>7</sup>
</td>
<td align="center">31929</td>
<td align="center">10964</td>
</tr>
<tr>
<td align="left">ZJ31</td>
<td align="center">109085</td>
<td align="center">2.3 &#xd7; 10<sup>7</sup>
</td>
<td align="center">8.0 &#xd7; 10<sup>6</sup>
</td>
<td align="center">62354</td>
<td align="center">32363</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Overview of variables and parameters. Parameters and variables and their estimated values if known. Some values need to be calculated from our model and are denoted &#x201c;calc.,&#x201d; while others need to be self-consistently estimated. For example, from GFP tagging, the fraction of tagged HSCs is approximately <inline-formula id="inf2">
<mml:math id="m2">
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>/</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2248;</mml:mo>
<mml:mn>15</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>35</mml:mn>
<mml:mi>%</mml:mi>
</mml:math>
</inline-formula> but can slowly vary in time. Values relating to sampled cell populations are derived from animal ZH33 in the experiment of (<xref ref-type="bibr" rid="B28">Koelle et al., 2017</xref>). HSC proliferation and death rates have been estimated in (<xref ref-type="bibr" rid="B44">Shepherd et al., 2007</xref>) and (<xref ref-type="bibr" rid="B8">Catlin et al., 2011</xref>). Numbers specific to granulocytes are indicated as such.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Variables/Parameters</th>
<th align="left">Definition</th>
<th align="left">Value</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">
<italic>t</italic>
<sub>
<italic>j</italic>
</sub>, <italic>j</italic> &#x3d; 1, &#x2026;, <italic>J</italic>
</td>
<td align="left">Sampling time points</td>
<td align="left">&#x223c;month</td>
</tr>
<tr>
<td align="center">
<inline-formula id="inf3">
<mml:math id="m3">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mspace width="1em"/>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>
</td>
<td align="left">No. of cells with tag <italic>i</italic> in sample drawn at <italic>t</italic>
<sub>
<italic>j</italic>
</sub> (data)</td>
<td align="left">
<inline-formula id="inf4">
<mml:math id="m4">
<mml:mo>&#x223c;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:msup>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="center">
<inline-formula id="inf5">
<mml:math id="m5">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>J</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="left">Mean no. of cells with tag <italic>i</italic> in sample (data)</td>
<td align="left">
<inline-formula id="inf6">
<mml:math id="m6">
<mml:mo>&#x223c;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:msup>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="center">
<inline-formula id="inf7">
<mml:math id="m7">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="left">Total no. of tagged granulocytes in each sample at <italic>t</italic>
<sub>
<italic>j</italic>
</sub> (data)</td>
<td align="left">
<inline-formula id="inf8">
<mml:math id="m8">
<mml:mo>&#x223c;</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>1</mml:mn>
<mml:msup>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>6</mml:mn>
</mml:mrow>
</mml:msup>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="center">
<inline-formula id="inf9">
<mml:math id="m9">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3e;</mml:mo>
<mml:mn>2</mml:mn>
<mml:mspace width="0.3333em"/>
<mml:mtext>months</mml:mtext>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="left">Total no. of clones (richness) in sample <italic>j</italic>
</td>
<td align="left">
<inline-formula id="inf10">
<mml:math id="m10">
<mml:mo>&#x223c;</mml:mo>
<mml:mn>1000</mml:mn>
</mml:math>
</inline-formula> (grans)</td>
</tr>
<tr>
<td align="center">
<inline-formula id="inf11">
<mml:math id="m11">
<mml:msubsup>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x3e;</mml:mo>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msubsup>
</mml:math>
</inline-formula>
</td>
<td align="left">Total richness across all <italic>t</italic> &#x3e; <italic>t</italic>
<sub>2</sub>
</td>
<td align="left">2,335 (grans)</td>
</tr>
<tr>
<td align="center">
<italic>h</italic>
<sub>0</sub>
</td>
<td align="left">Untagged HSCs in bone marrow (model)</td>
<td align="left">unknown, <inline-formula id="inf12">
<mml:math id="m12">
<mml:mo>&#x223c;</mml:mo>
<mml:mn>1</mml:mn>
<mml:msup>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="center">
<italic>h</italic>
<sub>
<italic>i</italic>
</sub>, <italic>i</italic> &#x3d; 1, &#x2026;, <italic>C</italic>
<sub>h</sub>
</td>
<td align="left">HSCs with barcode <italic>i</italic> in BM (model)</td>
<td align="left">1&#x2013;1,000</td>
</tr>
<tr>
<td align="center">
<inline-formula id="inf13">
<mml:math id="m13">
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="left">No. of <italic>&#x2113;</italic>
<sup>th</sup>-generation progenitor cells with tag/barcode <italic>i</italic> (model)</td>
<td align="left">calc</td>
</tr>
<tr>
<td align="center">
<italic>m</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>)</td>
<td align="left">No. mature cells with tag <italic>i</italic> (model)</td>
<td align="left">calc</td>
</tr>
<tr>
<td align="center">
<italic>s</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>)&#xa0;</td>
<td align="left">No. of cells with tag <italic>i</italic> in sample (model)</td>
<td align="left">calc</td>
</tr>
<tr>
<td align="center">
<italic>K</italic>
</td>
<td align="left">HSC niche carrying capacity (model)</td>
<td align="left">inferred, 10<sup>4</sup>&#x2013;10<sup>5</sup>
</td>
</tr>
<tr>
<td align="center">
<italic>C</italic>
<sub>h</sub>(<italic>t</italic>)</td>
<td align="left">Total no. of engrafted clones (model)</td>
<td align="left">unknown, <inline-formula id="inf14">
<mml:math id="m14">
<mml:mo>&#x223c;</mml:mo>
<mml:mn>1</mml:mn>
<mml:msup>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="center">
<italic>C</italic>
<sub>s</sub>(<italic>t</italic>)</td>
<td align="left">Total no. of clones sampled at <italic>t</italic> (model)</td>
<td align="left">simulated</td>
</tr>
<tr>
<td align="center">
<italic>r</italic>
<sub>h</sub>(0)</td>
<td align="left">Intrinsic HSC self-renewal rate</td>
<td align="left">&#x226b; 0.01/day</td>
</tr>
<tr>
<td align="center">
<italic>&#x3bc;</italic>
<sub>h</sub>
</td>
<td align="left">HSC death rate</td>
<td align="left">
<inline-formula id="inf15">
<mml:math id="m15">
<mml:mo>&#x3c;</mml:mo>
<mml:mn>0.01</mml:mn>
</mml:math>
</inline-formula>/day</td>
</tr>
<tr>
<td align="center">
<italic>&#x3b1;</italic>
</td>
<td align="left">HSC differentiation rate</td>
<td align="left">10<sup>&#x2013;3</sup> &#x2212; 0.02/day, inferred</td>
</tr>
<tr>
<td align="center">
<italic>r</italic>
<sub>n</sub>
</td>
<td align="left">Progenitor cell division rate</td>
<td align="left">1&#x2013;5/day</td>
</tr>
<tr>
<td align="center">
<italic>&#x3bc;</italic>
<sub>n</sub>
</td>
<td align="left">Progenitor cell death rate</td>
<td align="left">unknown, <inline-formula id="inf16">
<mml:math id="m16">
<mml:mo>&#x223c;</mml:mo>
<mml:mn>0</mml:mn>
</mml:math>
</inline-formula>/day</td>
</tr>
<tr>
<td align="center">
<italic>&#x3c9;</italic>
</td>
<td align="left">Progenitor cell terminal differentiation rate</td>
<td align="left">unknown, <inline-formula id="inf17">
<mml:math id="m17">
<mml:mo>&#x3c;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="center">
<italic>L</italic>
</td>
<td align="left">Proliferative potential of progenitor cells</td>
<td align="left">inferred, <italic>L</italic>&#x2a; &#x3d; 22 (grans)</td>
</tr>
<tr>
<td align="center">
<italic>&#x3bc;</italic>
<sub>m</sub>
</td>
<td align="left">Mature cell death rate</td>
<td align="left">0.185/day (grans)</td>
</tr>
<tr>
<td align="center">
<italic>&#x3b7;</italic>
</td>
<td align="left">Average sample fraction</td>
<td align="left">
<inline-formula id="inf18">
<mml:math id="m18">
<mml:mo>&#x223c;</mml:mo>
<mml:mn>1</mml:mn>
<mml:msup>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:msup>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:math>
</inline-formula>
</td>
</tr>
<tr>
<td align="center">
<italic>&#x3b7;</italic>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>)</td>
<td align="left">Fraction of sample <italic>j</italic>
</td>
<td align="left">
<inline-formula id="inf19">
<mml:math id="m19">
<mml:mo>&#x223c;</mml:mo>
<mml:mn>1</mml:mn>
<mml:msup>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:msup>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msup>
</mml:math>
</inline-formula>
</td>
</tr>
</tbody>
</table>
</table-wrap>
<sec id="s2-1">
<title>Measured quantities</title>
<p>First, we consider the observed data associated with each animal (<xref ref-type="bibr" rid="B28">Koelle et al., 2017</xref>), as shown in <xref ref-type="fig" rid="F1">Figure 1</xref>. Granulocytes in blood samples drawn from each animal at times points <italic>t</italic>
<sub>
<italic>j</italic>
</sub>, <italic>j</italic> &#x3d; 1, 2, &#x2026;, <italic>J</italic> are sequenced and clonal (barcode) abundances tabulated. The total abundance (number of mature cells of a given cell type), <inline-formula id="inf20">
<mml:math id="m20">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, and the richness <inline-formula id="inf21">
<mml:math id="m21">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> (the total number of different barcodes detected in each sample) are also recorded and plotted in <xref ref-type="fig" rid="F1">Figures 1A, B</xref>. In this study, <inline-formula id="inf22">
<mml:math id="m22">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> denotes the total measured number of granulocytes (barcoded and unbarcoded) in a sample taken at time <italic>t</italic>
<sub>
<italic>j</italic>
</sub>. The fluctuations of <inline-formula id="inf23">
<mml:math id="m23">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf24">
<mml:math id="m24">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> across <italic>t</italic>
<sub>
<italic>j</italic>
</sub> may arise from varying sampled sizes across time points and/or fluctuations in the state of the animal.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>After transplantation, peripheral blood samples were taken across <italic>J</italic> time points <italic>t</italic>
<sub>
<italic>j</italic>
</sub>, <italic>j</italic> &#x3d; 1, &#x2026;, <bold>(J)</bold>. Typically, measurements were taken over 20&#x2013;49&#xa0;months and <italic>J</italic> &#x3d; 10 &#x2212; 15. <bold>(A)</bold> The total population <inline-formula id="inf25">
<mml:math id="m25">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> of granulocytes sampled from animal ZH33 (<xref ref-type="bibr" rid="B28">Koelle et al., 2017</xref>) at times <italic>t</italic>
<sub>
<italic>j</italic>
</sub> &#x3d; (1, 2, 3, 4.5, 6.5, 9.5, 12, 14, 21, 28, 30, 38, 43, 46, 49) months. <bold>(B)</bold> The total richness in each sample, <inline-formula id="inf26">
<mml:math id="m26">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>. The richness at the first two time samples are large (as we shall see, due to transplantation of barcoded progenitor cells). After the first two time points, where the richness will arise from the richness of the transplanted HSCs, the typical richness at each time point <inline-formula id="inf27">
<mml:math id="m27">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2273;</mml:mo>
<mml:mn>2</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2248;</mml:mo>
<mml:mn>1000</mml:mn>
</mml:math>
</inline-formula>, while the richness across all <italic>J</italic> &#x2212; 2 time points (for <italic>t</italic>
<sub>
<italic>j</italic>
</sub> &#x3e; 2 months) is <inline-formula id="inf28">
<mml:math id="m28">
<mml:msubsup>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x3e;</mml:mo>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>2335</mml:mn>
</mml:math>
</inline-formula>. Across <italic>all</italic> <italic>J</italic> <italic>time points</italic>, 9,221 unique granulocyte clones were detected (out of a total of 25325 across <italic>all cell types</italic>). The individual clone abundances in the sampled granulocyte population are shown in <bold>(C)</bold> where the abundances of clone <italic>i</italic> in a sample taken at time <italic>t</italic>
<sub>
<italic>j</italic>
</sub> are denoted by <inline-formula id="inf29">
<mml:math id="m29">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>. The mean and standard deviation <inline-formula id="inf30">
<mml:math id="m30">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> of the abundances of all clones across all sampling times are calculated using Eq. <xref ref-type="disp-formula" rid="e1">1</xref> and scatter-plotted in <bold>(D)</bold>. Each point represents one of the 2,335 detected granulocyte clones. </p>
</caption>
<graphic xlink:href="fsysb-03-893366-g001.tif"/>
</fig>
<p>An example of the abundances of each clone within the granulocyte population from Koelle et al. (<xref ref-type="bibr" rid="B28">Koelle et al., 2017</xref>) is shown in <xref ref-type="fig" rid="F1">Figure 1C</xref>. In these experiments, tagged stem cells are transplanted back into a rhesus macaque at <italic>t</italic> &#x3d; 0 so that initially each clone consists of a single cell. A series of 1 &#x2264; <italic>j</italic> &#x2264; <italic>J</italic> samples are taken at time <italic>t</italic>
<sub>
<italic>j</italic>
</sub> after implementation, yielding a set of mature cells. We denote the abundance of clone <italic>i</italic> (among granulocyte cells) in the sample taken at time <italic>t</italic>
<sub>
<italic>j</italic>
</sub> after transplantation as <inline-formula id="inf31">
<mml:math id="m31">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>. The <italic>J</italic> measurements allow each clone of a particular mature cell type <italic>i</italic> to be characterized by a mean <inline-formula id="inf32">
<mml:math id="m32">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> and variance <inline-formula id="inf33">
<mml:math id="m33">
<mml:msubsup>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msubsup>
</mml:math>
</inline-formula> defined by<disp-formula id="e1">
<mml:math id="m34">
<mml:mtable class="aligned">
<mml:mtr>
<mml:mtd columnalign="right">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>J</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>J</mml:mi>
</mml:mrow>
</mml:munderover>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="right">
<mml:msubsup>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>J</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>J</mml:mi>
</mml:mrow>
</mml:munderover>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>.</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:math>
<label>(1)</label>
</disp-formula>
</p>
<p>Note that the total measured population of any cell type <inline-formula id="inf34">
<mml:math id="m35">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>. A scatter plot of <inline-formula id="inf35">
<mml:math id="m36">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> versus <inline-formula id="inf36">
<mml:math id="m37">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> for all clones detected in a sample of granulocytes is shown in <xref ref-type="fig" rid="F1">Figure 1D</xref>.</p>
<p>For each clone at <inline-formula id="inf37">
<mml:math id="m38">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> we can evaluate the local density <inline-formula id="inf38">
<mml:math id="m39">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula>, the number of clones within some size window. This density can be viewed as the concentration of data points shown in <xref ref-type="fig" rid="F1">Figure 1D</xref> as a function of mean clone size <inline-formula id="inf39">
<mml:math id="m40">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula>, and will be constructed using kernel density estimation (<xref ref-type="bibr" rid="B42">Rosenblatt, 1956</xref>; <xref ref-type="bibr" rid="B39">Parzen, 1962</xref>) of the data points in <inline-formula id="inf40">
<mml:math id="m41">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mspace width="0.3333em"/>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> space. The unknown density function <inline-formula id="inf41">
<mml:math id="m42">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> is obtained by concatenating isotropic Gaussian kernel functions about each point and using an optimal, common bandwidth parameter, typically chosen as the value that minimizes the mean integrated squared error, or Kernel Density Estimation (KDE) (<xref ref-type="bibr" rid="B45">Silverman, 1986</xref>). The reconstructed density function can be thought of as a probability that a random clone arises in the volume (<italic>s</italic>, <italic>s</italic> &#x2b; d<italic>s</italic>) &#xd7; (<italic>&#x3c3;</italic>, <italic>&#x3c3;</italic> &#x2b; d<italic>&#x3c3;</italic>). For each clone at <inline-formula id="inf42">
<mml:math id="m43">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> we can evaluate the local density <inline-formula id="inf43">
<mml:math id="m44">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
<p>In the remainder of this paper we will develop a mathematical model that we can simulate to generate total populations, clonal populations, and their associated attributes (<italic>s</italic>
<sub>
<italic>i</italic>
</sub>, <italic>&#x3c3;</italic>
<sub>
<italic>i</italic>
</sub>, <italic>&#x3c1;</italic>
<sub>
<italic>i</italic>
</sub>). Note that while there are many existing mathematical models of hematopoiesis (<xref ref-type="bibr" rid="B11">Colijn and Mackey, 2005</xref>; <xref ref-type="bibr" rid="B40">Peixoto et al., 2011</xref>; <xref ref-type="bibr" rid="B16">De Souza and Humphries, 2019</xref>), they describe only time variations in total populations, rather than that of lower-population, individual clones. We will tune parameters of the model so that its predictions provide a reasonable match to the aforementioned measurements, paying particular attention to clone abundances and clone size variability.</p>
</sec>
<sec id="s2-2">
<title>Mathematical modeling</title>
<p>Our mathematical model incorporates known and accepted features of hematopoiesis. Three main cell compartments are considered: hematopoietic stem cells (HSCs), transit amplifying progenitor cells, and peripheral mature cells. Although the stem cell population in bone marrow is large and can be described using a deterministic model, the initial populations within each clone are small and require a discrete stochastic description. We will then assume that a small sample of mature cells is drawn from the animals at times <italic>t</italic>
<sub>
<italic>j</italic>
</sub>, <italic>j</italic> &#x3d; 1, 2, &#x2026;, <italic>J</italic> and sequenced.</p>
<p>We first describe the initial conditions including the number of HSCs and HSPCs injected into each animal. As listed in <xref ref-type="table" rid="T1">Table 1</xref>, <italic>H</italic> is the total number of HSCs injected into each animal, among which <italic>H</italic>
<sub>0</sub> are untagged and <italic>H</italic>
<sub>
<italic>i</italic>
</sub> &#x226A; <italic>H</italic>
<sub>0</sub> contain barcode 1 &#x2264; <italic>i</italic> &#x2264; <italic>C</italic>
<sub>
<italic>H</italic>
</sub> (and are GFP&#x2b;). The total tagged HSC population is <inline-formula id="inf44">
<mml:math id="m45">
<mml:msup>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mo>&#x2261;</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> so that <italic>H</italic> &#x3d; <italic>H</italic>
<sub>0</sub> &#x2b; <italic>H</italic>&#x2a;. The richness <italic>C</italic>
<sub>
<italic>H</italic>
</sub> &#x2272; <italic>C</italic>
<sub>
<italic>L</italic>
</sub> is the number of barcodes transferred into the animal, which is comparable to the richness of the barcode library <italic>C</italic>
<sub>
<italic>L</italic>
</sub> used in each experiment. Since <italic>H</italic>
<sub>0</sub> &#x223c; 10<sup>7</sup> &#x226B; <italic>H</italic>
<sub>
<italic>i</italic>
</sub>, we will consider the probability distribution of only the tagged populations, which is described by the multinomial<disp-formula id="e2">
<mml:math id="m46">
<mml:mi>P</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi mathvariant="bold">H</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
<mml:mo>!</mml:mo>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x220f;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:munderover>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msup>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>!</mml:mo>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:math>
<label>(2)</label>
</disp-formula>where <inline-formula id="inf45">
<mml:math id="m47">
<mml:mi mathvariant="bold">H</mml:mi>
<mml:mo>&#x2261;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> and <italic>H</italic>&#x2a; is the total number of GFP&#x2b; (barcoded) cells. Specifically, for animal ZH33 studied in (<xref ref-type="bibr" rid="B28">Koelle et al., 2017</xref>)) <italic>H</italic> &#x2248; 3 &#xd7; 10<sup>7</sup>, <italic>H</italic>&#x2a;/<italic>H</italic> &#x2248; 0.35, <inline-formula id="inf46">
<mml:math id="m48">
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2248;</mml:mo>
<mml:mn>1.1</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>1</mml:mn>
<mml:msup>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>7</mml:mn>
</mml:mrow>
</mml:msup>
</mml:math>
</inline-formula>, <italic>C</italic>
<sub>
<italic>H</italic>
</sub> &#x2272; <italic>C</italic>
<sub>
<italic>L</italic>
</sub> &#x2248; 6 &#xd7; 10<sup>5</sup>. Thus, the typical <italic>H</italic>
<sub>
<italic>i</italic>
</sub> &#x2248; <italic>H</italic>&#x2a;/<italic>C</italic>
<sub>
<italic>H</italic>
</sub> &#x223c; 180.</p>
<p>A certain fraction <italic>&#x3b7;</italic>
<sub>0</sub> of the <italic>H</italic> HSCs home into the bone marrow, successfully engraft, and subsequently actively self-renewal and/or differentiate. Engrafted HSC populations are defined by <inline-formula id="inf47">
<mml:math id="m49">
<mml:mi mathvariant="bold">h</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
<mml:mspace width="-0.17em"/>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, where the richness of engrafted HSCs in the bone marrow is <italic>C</italic>
<sub>h</sub> &#x2272; <italic>C</italic>
<sub>
<italic>H</italic>
</sub>. Transplantation efficiencies are typically single-digit percentages (<xref ref-type="bibr" rid="B1">Abbuehl et al., 2017</xref>; <xref ref-type="bibr" rid="B41">Radtke et al., 2020</xref>) and transplanted CD34<sup>&#x2b;</sup> cells contain significant numbers of progenitor cells. Thus, the fraction <italic>&#x3b7;</italic>
<sub>0</sub> &#x226A; 1; if <italic>&#x3b7;</italic>
<sub>0</sub> is sufficiently small (approximately &#x2272; 1/180), then we can safely assume that the initial clone populations in bone marrow are represented by very few cells. For simplicity, we approximate <italic>h</italic>
<sub>
<italic>i</italic>
</sub>(0) &#x2248; 1. Even if <italic>&#x3b7;</italic>
<sub>0</sub>&#x2270;1/180, most barcodes will be represented by very few cells. We have verified that an initial condition in our model that allows for, say, some <italic>h</italic>
<sub>
<italic>i</italic>
</sub>(0) &#x3d; 2, 3 does not qualitatively affect the mature cell populations.</p>
<p>The random selection of cells into the bone marrow can be thought of as a sampling (without replacement) process. Including the untagged population, the probability distribution of engrafted cells resulting from the injected tagged cell population <inline-formula id="inf48">
<mml:math id="m50">
<mml:mi mathvariant="bold">H</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> is given by<disp-formula id="e3">
<mml:math id="m51">
<mml:mi>P</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi mathvariant="bold">h</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
<mml:mo stretchy="false">&#x7c;</mml:mo>
<mml:mi mathvariant="bold">H</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mfrac linethickness="0">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfrac>
</mml:mfenced>
</mml:mrow>
</mml:mfrac>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x220f;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:munderover>
<mml:mfenced open="(" close=")">
<mml:mfrac linethickness="0">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfrac>
</mml:mfenced>
<mml:mo>,</mml:mo>
</mml:math>
<label>(3)</label>
</disp-formula>where <italic>H</italic>&#x2a; and <inline-formula id="inf49">
<mml:math id="m52">
<mml:msup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> are the total initial numbers of barcoded injected cells and engrafted barcoded HSCs, summed over all clones. Note that the number of untagged transplanted cells <italic>h</italic>
<sub>0</sub>(0) &#x226B; 1 is large so that we can approximate it by its deterministic value <italic>h</italic>
<sub>0</sub>(0) &#x2248; <italic>&#x3b7;</italic>
<sub>0</sub>
<italic>H</italic>
<sub>0</sub>.</p>
<p>To extract the overall probability of initial condition <bold>h</bold>(0), we average Eq. <xref ref-type="disp-formula" rid="e3">3</xref> over the prior <inline-formula id="inf50">
<mml:math id="m53">
<mml:mi>P</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> and find<disp-formula id="e4">
<mml:math id="m54">
<mml:mi>P</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi mathvariant="bold">h</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:munder>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="bold">H</mml:mi>
</mml:mrow>
</mml:munder>
<mml:mi>P</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi mathvariant="bold">h</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
<mml:mo stretchy="false">&#x7c;</mml:mo>
<mml:mi mathvariant="bold">H</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mi>P</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi mathvariant="bold">H</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
<mml:mo>!</mml:mo>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x220f;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:munderover>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mspace width="-0.17em"/>
<mml:mspace width="-0.17em"/>
<mml:mspace width="-0.17em"/>
<mml:mspace width="-0.17em"/>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
<mml:mo>!</mml:mo>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
<mml:mspace width="1em"/>
<mml:msup>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2261;</mml:mo>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:munderover>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
<mml:mo>.</mml:mo>
</mml:math>
<label>(4)</label>
</disp-formula>
</p>
<p>Besides the initial condition <italic>h</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic> &#x3d; 0) &#x3d; 1, the initial number of untagged HSCs <italic>h</italic>
<sub>0</sub>(<italic>t</italic> &#x3d; 0) is related to the transplantation efficiency and is generally unknown. Barcodes are associated with a GFP tag and the initial fraction of sampled cells that are GFP&#x2b; is <inline-formula id="inf51">
<mml:math id="m55">
<mml:mo>&#x223c;</mml:mo>
<mml:mn>35</mml:mn>
<mml:mi>%</mml:mi>
</mml:math>
</inline-formula>. Since we assume a neutral model, it is reasonable to assume that the fraction of injected tagged cells <italic>H</italic>&#x2a;/<italic>H</italic> is equivalent to the fraction of tagged cells in the engrafted population <inline-formula id="inf52">
<mml:math id="m56">
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>/</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2248;</mml:mo>
<mml:mn>0.35</mml:mn>
</mml:math>
</inline-formula> (although this ratio slowly decreases <italic>via</italic> extinction). The precise richness of HSC population in stem cell niche, <italic>C</italic>
<sub>h</sub>(<italic>t</italic>) &#x3c; <italic>C</italic>
<sub>
<italic>H</italic>
</sub> is also unknown, but except for fluctuations, has a lower bound of <inline-formula id="inf53">
<mml:math id="m57">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>, the total number of unique clones detected across all samples across all cell types. Thus, we take <inline-formula id="inf54">
<mml:math id="m58">
<mml:mi>h</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2248;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>/</mml:mo>
<mml:mn>0.35</mml:mn>
</mml:math>
</inline-formula>.</p>
<p>Self-renewal, death, and differentiation into progenitor cells all contribute to the stochastic dynamics of <italic>h</italic>
<sub>
<italic>i</italic>
</sub>. Although the <italic>total</italic> HSC population in the niche <inline-formula id="inf55">
<mml:math id="m59">
<mml:mi>h</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2248;</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> is large and can be approximated deterministically, the HSC population of each clone <italic>h</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>) may be small and must be treated stochastically. Under our neutral assumption, the intrinsic self-renewal rate <italic>r</italic>
<sub>h</sub> of HSCs does not depend on the barcode identity <italic>i</italic>. Since HSCs reside in niches in the bone marrow that place limits on growth, we assume the HSC proliferation rate follows a linearly decreasing form defined by a carrying capacity and the engrafted HSC population <italic>h</italic>(<italic>t</italic>)<disp-formula id="e5">
<mml:math id="m60">
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>h</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>h</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mi>K</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mfenced>
<mml:mspace width="0.3333em"/>
<mml:mspace width="0.3333em"/>
<mml:mspace width="0.3333em"/>
<mml:mspace width="0.3333em"/>
<mml:mtext>, </mml:mtext>
<mml:mspace width="0.3333em"/>
<mml:mspace width="0.3333em"/>
<mml:mspace width="0.3333em"/>
<mml:mi>h</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2261;</mml:mo>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:munderover>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
</mml:math>
<label>(5)</label>
</disp-formula>where <italic>r</italic>
<sub>h</sub>(0) is the intrinsic proliferation rate of a single, isolated HSC. Note that the untagged HSCs are included through <italic>h</italic>
<sub>0</sub>. Finally, we assume that HSCs die at rate <italic>&#x3bc;</italic>
<sub>h</sub> and differentiate at rate <italic>&#x3b1;</italic> and that these rates, like the growth rate in Eq. <xref ref-type="disp-formula" rid="e5">5</xref>, do not depend on barcode identity.</p>
<p>As shown in the <xref ref-type="sec" rid="s10">Supplementary Material</xref>, the richness <italic>C</italic>
<sub>h</sub>(<italic>t</italic>) may progressively decrease from random HSC death and extinction and can be estimated by solving for the stochastic birth-death process (neglecting outflux from differentiation) and using generating functions to find<disp-formula id="e6">
<mml:math id="m61">
<mml:mi mathvariant="double-struck">E</mml:mi>
<mml:mfenced open="[" close="]">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2248;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x3c8;</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>&#x3d5;</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:math>
<label>(6)</label>
</disp-formula>where<disp-formula id="e7">
<mml:math id="m62">
<mml:mi>&#x3c8;</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2261;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mo>&#x222b;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:mfenced open="[" close="]">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:mspace width="1em"/>
<mml:mi>&#x3d5;</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2261;</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mo>&#x222b;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
<mml:mi>&#x3c8;</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mo>.</mml:mo>
</mml:math>
<label>(7)</label>
</disp-formula>
</p>
<p>In this expression, <italic>r</italic>
<sub>h</sub>(<italic>t</italic>) is approximated by <inline-formula id="inf56">
<mml:math id="m63">
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mo>&#x304;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mo>&#x304;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, where <inline-formula id="inf57">
<mml:math id="m64">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mo>&#x304;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mo>&#x304;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> is given by the explicit solution to the deterministic birth-death process with carrying capacity <italic>K</italic>. Thus, given <italic>C</italic>
<sub>h</sub>(0), <italic>r</italic>
<sub>h</sub>(0), <italic>K</italic>, and <italic>&#x3bc;</italic>
<sub>h</sub> determine how the expected richness decreases. Henceforth we treat <italic>C</italic>
<sub>h</sub>(<italic>t</italic>) in our model as the expected value <inline-formula id="inf58">
<mml:math id="m65">
<mml:mi mathvariant="double-struck">E</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> derived from our stochastic birth-death model, <italic>i.e.</italic>, we use <italic>C</italic>
<sub>h</sub>(0)/(<italic>&#x3c8;</italic>(<italic>t</italic>) &#x2b; <italic>&#x3d5;</italic>(<italic>t</italic>)) as the model for <italic>C</italic>
<sub>h</sub>(<italic>t</italic>).</p>
<p>We will also simulate the stochastic birth-death process for HSCs (see <xref ref-type="sec" rid="s10">Supplementary Material</xref> for details), with the differentiation rate <italic>&#x3b1;</italic> that allows HSCs to differentiate into the progenitor/transit amplifying cell compartment (see <xref ref-type="fig" rid="F2">Figure 2</xref>). Progenitor cells are further distinguished by their generation <italic>&#x2113;</italic>. Thus, <italic>&#x2113;</italic> not only measures generation number but also an effective differentiation state. Each HSC differentiation event leads to an <italic>&#x2113;</italic> &#x3d; 0 progenitor cell. Since the number of HSCs of any one clone is small, the initial differentiation events from clone <italic>i</italic> follow a Poisson process with rate <italic>&#x3b1;h</italic>
<sub>
<italic>i</italic>
</sub>. The populations of the subsequent generations of progenitor cells in clone <italic>i</italic> are denoted by <inline-formula id="inf59">
<mml:math id="m66">
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:math>
</inline-formula>. Once the <italic>&#x2113;</italic> &#x3d; 0 generation cells are generated, the number of progenitor cells quickly expand, so their dynamics will be described by a deterministic model as developed in (<xref ref-type="bibr" rid="B55">Xu et al., 2018</xref>)<disp-formula id="e8">
<mml:math id="m67">
<mml:mfrac>
<mml:mrow>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#x3d;</mml:mo>
<mml:mfenced open="{" close="">
<mml:mrow>
<mml:mtable class="cases">
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mtext>Poisson</mml:mtext>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2212;</mml:mo>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x2b;</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mi>&#x2113;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mn>2</mml:mn>
<mml:msubsup>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2212;</mml:mo>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x2b;</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mn>1</mml:mn>
<mml:mo>&#x2264;</mml:mo>
<mml:mi>&#x2113;</mml:mi>
<mml:mo>&#x2264;</mml:mo>
<mml:mi>L</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>,</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mn>2</mml:mn>
<mml:msubsup>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2212;</mml:mo>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>&#x3c9;</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>L</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:mfenced>
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>L</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mi>&#x2113;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>L</mml:mi>
<mml:mo>,</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mfenced>
</mml:math>
<label>(8)</label>
</disp-formula>where Poisson(<italic>&#x3b1;h</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>)) is the time-inhomogeneous point Poisson process describing HSC differentiation events. In other words, after a differentiation event at time <italic>t</italic>
<sub>1</sub>, the probability density of the time &#x394;<italic>t</italic> to the next differentiation event is given by <inline-formula id="inf60">
<mml:math id="m68">
<mml:mi>&#x3b1;</mml:mi>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mi mathvariant="normal">&#x394;</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mi>exp</mml:mi>
<mml:mfenced open="[" close="]">
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
<mml:msubsup>
<mml:mrow>
<mml:mo>&#x222b;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">&#x394;</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mi>s</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:math>
</inline-formula>. We will use the values of <italic>h</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>) from our stochastic simulations and sample from this inter-event time density to simulate realizations of differentiation events.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Schematic of the hybrid stochastic-deterministic model. Tagged (barcoded) stem cells are transplanted into an animal initially with one cell (<italic>h</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic> &#x3d; 0) &#x2248; 1) per clone. These cells, together with the untagged ones (<italic>h</italic>
<sub>0</sub>(<italic>t</italic> &#x3d; 0) &#x226B; 1) then undergo self-renewal and death, at rates <inline-formula id="inf61">
<mml:math id="m69">
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>h</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:msub>
<mml:msub>
<mml:mrow>
<mml:mi>h</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mfenced>
</mml:math>
</inline-formula> and <italic>&#x3bc;</italic>
<sub>h</sub>, respectively, in the bone marrow. HSCs in all clones are also assumed to undergo asymmetric differentiation with rate <italic>&#x3b1;</italic>, forming a zeroth-generation progenitor cells. The population of <italic>&#x2113;</italic>
<sup>th</sup>-generation (or stage) progenitor cells, denoted <inline-formula id="inf62">
<mml:math id="m70">
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:math>
</inline-formula>, further symmetrically differentiate with each division, up to a maximum of <italic>&#x2113;</italic> &#x3d; <italic>L</italic> generations. The final-generation cell in clone <italic>i</italic> with population <inline-formula id="inf63">
<mml:math id="m71">
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>L</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:math>
</inline-formula> can then undergo terminal differentiation at rate <italic>&#x3c9;</italic> to form mature, circulating peripheral blood cells. Mature cells at population <italic>m</italic>
<sub>
<italic>i</italic>
</sub> are then randomly sampled (with sampling fraction <italic>&#x3b7;</italic> and generating a sample population <italic>s</italic>
<sub>
<italic>i</italic>
</sub>) and sequenced. We wish to infer some of the parameters of the model by comparing the predicted means, standard deviations, and clone number densities with those from data (<xref ref-type="fig" rid="F1">Figure 1</xref>). Lineage differentiation is schematically shown as a splitting of the grey clone between generations <italic>&#x2113;</italic> &#x3d; 1 and <italic>&#x2113;</italic> &#x3d; 2, where a new cell type (squares) branches off. The division and death rates of progenitor cells in this new lineage, <inline-formula id="inf64">
<mml:math id="m72">
<mml:msubsup>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msubsup>
</mml:math>
</inline-formula> and <inline-formula id="inf65">
<mml:math id="m73">
<mml:msubsup>
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msubsup>
</mml:math>
</inline-formula>, may be different, as may the maximum number of generations <italic>L</italic>&#x2032;. The mature cells turn over with rate a <italic>&#x3bc;</italic>
<sub>m</sub> that may depend on lineage (but not clone identity within each lineage). In this paper, we assume that the lineages diverge at the zeroth-generation progenitor cell and analyze the model after the first differentiation step (rate <italic>&#x3b1;</italic>) independently for different cell types (in this paper, granulocytes).</p>
</caption>
<graphic xlink:href="fsysb-03-893366-g002.tif"/>
</fig>
<p>In Eq. <xref ref-type="disp-formula" rid="e8">8</xref>, <inline-formula id="inf66">
<mml:math id="m74">
<mml:msubsup>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:math>
</inline-formula> and <inline-formula id="inf67">
<mml:math id="m75">
<mml:msubsup>
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:math>
</inline-formula> represent the proliferation and death rates of generation-<italic>&#x2113;</italic> progenitor cells, respectively, and <italic>&#x3c9;</italic> is the terminal differentiation rate into mature blood. Each division can also be thought of symmetric differentiation producing successively more differentiated progenitor cells. To model the finite proliferative potential of progenitor cells, we set the maximum number of generations to <italic>&#x2113;</italic> &#x3d; <italic>L</italic>, after which the <italic>L</italic>
<sup>th</sup> generation cell can only terminally differentiate to mature blood.</p>
<p>Consider a single isolated differentiation event of an HSC at <italic>t</italic> &#x3d; 0 belonging to a particular clone. The resulting progenitor cell population after this event is described by Eq. <xref ref-type="disp-formula" rid="e8">8</xref> without the Poisson(<italic>&#x3b1;h</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>)) term but with an initial condition corresponding to a single <italic>&#x2113;</italic> &#x3d; 0 cell:<disp-formula id="e9">
<mml:math id="m76">
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:mfenced open="{" close="">
<mml:mrow>
<mml:mtable class="cases">
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mn>1</mml:mn>
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mi>&#x2113;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="left">
<mml:mn>0</mml:mn>
<mml:mspace width="1em"/>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mtext>otherwise.</mml:mtext>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mfenced>
</mml:math>
<label>(9)</label>
</disp-formula>
</p>
<p>The subsequent populations at time <italic>t</italic> form a temporal &#x201c;burst&#x201d; of cells that are described by <inline-formula id="inf68">
<mml:math id="m77">
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> which is the solution of Eq. <xref ref-type="disp-formula" rid="e8">8</xref> without the Poisson(<italic>&#x3b1;h</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>)) term but using the initial condition in Eq. <xref ref-type="disp-formula" rid="e9">9</xref>. If we assume that all progenitor generations carry the same division and death rates, <inline-formula id="inf69">
<mml:math id="m78">
<mml:msubsup>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> for 0 &#x2264; <italic>&#x2113;</italic> &#x2264; <italic>L</italic> &#x2212; 1 and <inline-formula id="inf70">
<mml:math id="m79">
<mml:msubsup>
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> for 0 &#x2264; <italic>&#x2113;</italic> &#x2264; <italic>L</italic>, we can find an analytical solution associated with a single isolated burst as<disp-formula id="e10">
<mml:math id="m80">
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>L</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>&#x3c9;</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfenced>
<mml:mo>!</mml:mo>
</mml:mrow>
</mml:mfrac>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x3c9;</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mi>L</mml:mi>
</mml:mrow>
</mml:msup>
<mml:msubsup>
<mml:mrow>
<mml:mo>&#x222b;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x3c9;</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mi>z</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>L</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msup>
<mml:msup>
<mml:mrow>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>z</mml:mi>
</mml:mrow>
</mml:msup>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mi>z</mml:mi>
<mml:mo>.</mml:mo>
</mml:math>
<label>(10)</label>
</disp-formula>We can evaluate all populations <inline-formula id="inf71">
<mml:math id="m81">
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> for <italic>&#x2113;</italic> &#x3c; <italic>L</italic> by solving Eq. <xref ref-type="disp-formula" rid="e8">8</xref> and using Eq. <xref ref-type="disp-formula" rid="e10">10</xref>, as detailed in the <xref ref-type="sec" rid="s10">Supplementary Material</xref>.</p>
<p>If we assume that mature cells do not appreciably proliferate<xref ref-type="fn" rid="fn1">
<sup>1</sup>
</xref>, the mature cell population in clone <italic>i</italic> obeys<disp-formula id="e11">
<mml:math id="m82">
<mml:mfrac>
<mml:mrow>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:msub>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>&#x3c9;</mml:mi>
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>L</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:msub>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
</mml:math>
<label>(11)</label>
</disp-formula>where <italic>&#x3bc;</italic>
<sub>m</sub> is the lineage-dependent turnover rate of mature cells. Using the solution to <inline-formula id="inf72">
<mml:math id="m83">
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>L</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, we solve Eq. <xref ref-type="disp-formula" rid="e11">11</xref> to find (see <xref ref-type="sec" rid="s10">Supplementary Material</xref>)<disp-formula id="e12">
<mml:math id="m84">
<mml:msub>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>&#x3c9;</mml:mi>
<mml:msubsup>
<mml:mrow>
<mml:mo>&#x222b;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>L</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msubsup>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
<mml:msup>
<mml:mrow>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mo>.</mml:mo>
</mml:math>
<label>(12)</label>
</disp-formula>
</p>
<p>The mature cell population burst (of a specific clone) arising from a single, isolated differentiation event is plotted in <xref ref-type="fig" rid="F3">Figure 3A</xref>. Note that the expression for a mature cell burst given in Eq. <xref ref-type="disp-formula" rid="e12">12</xref> is derived from the specific initial condition Eq. <xref ref-type="disp-formula" rid="e9">9</xref>; however, some low-<italic>&#x2113;</italic> progenitors are also initially transplanted (see below). Thus, <italic>m</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>) will in general depend on the initial numbers of <italic>n</italic>
<sup>(<italic>&#x2113;</italic>&#x3e;0)</sup>(0).</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>
<bold>(A)</bold> The population <italic>m</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>) of mature cells resulting from a single HSC differentiation event as obtained from Eq. <xref ref-type="disp-formula" rid="e12">12</xref>. <bold>(B)</bold> Multiple concatenated bursts from a low-population HSC clone showing well-separated intermittent pulses obtained <italic>via</italic> Eq. <xref ref-type="disp-formula" rid="e13">13</xref>. <bold>(C)</bold> When the HSC population of a clone is large, the resulting mature cell population bursts merge together and exhibit lower relative variability.</p>
</caption>
<graphic xlink:href="fsysb-03-893366-g003.tif"/>
</fig>
<p>Since Eq. <xref ref-type="disp-formula" rid="e8">8</xref> are linear, populations arising from a sequence of Poisson-distributed differentiation events can be constructed by adding those derived from single events occurring at times <italic>T</italic>
<sub>
<italic>k</italic>
</sub>. In this case, the resulting mature cell population at time <italic>t</italic> is given by<disp-formula id="e13">
<mml:math id="m85">
<mml:msub>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>max</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:munderover>
<mml:msub>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
<mml:mspace width="1em"/>
<mml:msub>
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>max</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3e;</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>&#x3e;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>max</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
</mml:math>
<label>(13)</label>
</disp-formula>where <italic>m</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic> &#x2212; <italic>T</italic>
<sub>
<italic>k</italic>
</sub>) is the solution given in Eq. <xref ref-type="disp-formula" rid="e12">12</xref> (for the specific initial condition in Eq. <xref ref-type="disp-formula" rid="e9">9</xref>). Two different sequences of bursts are shown in <xref ref-type="fig" rid="F3">Figures 3B, C</xref>. In <xref ref-type="fig" rid="F3">Figure 3B</xref>, we consider a clone with few HSCs such that <italic>&#x3b1;h</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>) &#x226A; <italic>&#x3bc;</italic>
<sub>m</sub>. This limit gives rise to differentiation events that occur rarely over the lifespan of mature cells, as depicted <xref ref-type="fig" rid="F3">Figure 3B</xref>. In <xref ref-type="fig" rid="F3">Figure 3C</xref>, we plot a sequence of more frequent mature cell population bursts that arise for more frequent differentiation events <italic>&#x3b1;h</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>) &#x226B; <italic>&#x3bc;</italic>
<sub>m</sub> from HSCs that are in higher population clones.</p>
<p>Recall that the calculations involving Eqs <xref ref-type="disp-formula" rid="e8">8</xref>&#x2013;<xref ref-type="disp-formula" rid="e12">12</xref> are performed for each clone <italic>i</italic>, resulting in a series of time-dependent expressions for <italic>m</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>) as per Eq. <xref ref-type="disp-formula" rid="e12">12</xref>. These single event responses are then summed according to Eq. <xref ref-type="disp-formula" rid="e13">13</xref> to arrive at the total, time-dependent population of mature cells of a specific type and carrying the same barcode. These predicted whole-organism populations depend on the model parameters <inline-formula id="inf73">
<mml:math id="m86">
<mml:mfenced open="{" close="}">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>K</mml:mi>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3bc;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">m</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mi>L</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x3c9;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:math>
</inline-formula>. Since growth of transit amplifying progenitor cells is fast, we will henceforth assume <italic>r</italic>
<sub>n</sub> &#x226B; <italic>&#x3bc;</italic>
<sub>n</sub> &#x2248; 0. All other rates are given in units of per day.</p>
<p>Since the clone abundances are derived from sequencing cells in a small fraction <italic>&#x3b7;</italic> (for rhesus macaque, <italic>&#x3b7;</italic> &#x223c; 10<sup>&#x2013;5</sup> &#x2212; 10<sup>&#x2013;4</sup>) of the animal&#x2019;s blood taken at times <italic>t</italic>
<sub>
<italic>j</italic>
</sub>, we also need expressions for mature cell populations within a sample. Given the small sample sizes <italic>&#x3b7;</italic>, low population clones in the mature cell pool can easily be missed. For a given population <italic>m</italic>
<sub>
<italic>i</italic>
</sub> in the whole animal, the probability that <italic>s</italic>
<sub>
<italic>i</italic>
</sub> cells are captured in the sample is given by (<xref ref-type="bibr" rid="B10">Chao and Lin, 2012</xref>; <xref ref-type="bibr" rid="B54">Xu et al., 2020</xref>)<disp-formula id="e14">
<mml:math id="m87">
<mml:mtable class="aligned">
<mml:mtr>
<mml:mtd columnalign="right">
<mml:mi mathvariant="double-struck">P</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mfenced open="{" close="}">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
<mml:mo stretchy="false">&#x7c;</mml:mo>
<mml:mfenced open="{" close="}">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
<mml:mo>,</mml:mo>
<mml:mi>S</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>M</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mfrac linethickness="0">
<mml:mrow>
<mml:mi>M</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mfenced>
</mml:mrow>
</mml:mfrac>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x220f;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:munderover>
<mml:mfenced open="(" close=")">
<mml:mfrac linethickness="0">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mfenced>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd columnalign="right"/>
<mml:mtd columnalign="left">
<mml:mo>&#x2248;</mml:mo>
<mml:munder>
<mml:mrow>
<mml:mo>&#x220f;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:munder>
<mml:mfenced open="(" close=")">
<mml:mfrac linethickness="0">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mfenced>
<mml:msup>
<mml:mrow>
<mml:mi>&#x3b7;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msup>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>&#x3b7;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:math>
<label>(14)</label>
</disp-formula>where, for a given cell type (for example granulocytes), <italic>S</italic>(<italic>t</italic>) &#x3d; <italic>&#x2211;</italic>
<sub>
<italic>i</italic>&#x3d;0</sub>
<italic>s</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>) is the total number of sampled cells (including untagged ones), <italic>M</italic>(<italic>t</italic>) &#x3d; <italic>&#x2211;</italic>
<sub>
<italic>i</italic>&#x3d;0</sub>
<italic>m</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>) is the total number of circulating mature cells (including untagged ones), and the sampling fraction is <italic>&#x3b7;</italic> &#x3d; <italic>S</italic>/<italic>M</italic> (which we first assume is the same at each <italic>t</italic>
<sub>
<italic>j</italic>
</sub>).</p>
<p>After computing <italic>m</italic>
<sub>
<italic>i</italic>
</sub> at time <italic>t</italic>
<sub>
<italic>j</italic>
</sub> using Eq. <xref ref-type="disp-formula" rid="e12">12</xref>, we take the nearest integer value and use it for <italic>m</italic>
<sub>
<italic>i</italic>
</sub> in Eq. <xref ref-type="disp-formula" rid="e14">14</xref>. We then draw a single value <italic>s</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>) from the binomial distribution, assuming <italic>&#x3b7;</italic> is given. Finally, we simulate our model to generate trajectories of <italic>M</italic>(<italic>t</italic>) and then determine the tagged sampled fraction<disp-formula id="e15">
<mml:math id="m88">
<mml:mi>S</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x2248;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:mi>H</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mi>&#x3b7;</mml:mi>
<mml:mi>M</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>.</mml:mo>
</mml:math>
<label>(15)</label>
</disp-formula>
</p>
<p>Equations <xref ref-type="disp-formula" rid="e5">5</xref>&#x2013;<xref ref-type="disp-formula" rid="e15">15</xref> represent a hybrid stochastic-deterministic model since the self-renewal process of a small number of HSCs in each clone and the final sampling step (Eq. <xref ref-type="disp-formula" rid="e14">14</xref>) are modeled as discrete stochastic processes, while proliferation and differentiation of higher population progenitor and mature cells are treated deterministically <italic>via</italic> Eqs <xref ref-type="disp-formula" rid="e8">8</xref>&#x2013;<xref ref-type="disp-formula" rid="e12">12</xref>. The values <italic>s</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>) obtained from the model in Eqs <xref ref-type="disp-formula" rid="e8">8</xref>&#x2013;<xref ref-type="disp-formula" rid="e14">14</xref> are used to generate the predicted clone population mean and standard deviations, <italic>s</italic>
<sub>
<italic>i</italic>
</sub> and <italic>&#x3c3;</italic>
<sub>
<italic>i</italic>
</sub>, according to Eq. <xref ref-type="disp-formula" rid="e1">1</xref>. Both <italic>s</italic>
<sub>
<italic>i</italic>
</sub>, <italic>&#x3c3;</italic>
<sub>
<italic>i</italic>
</sub> are then used to determine the density of points <italic>&#x3c1;</italic>
<sub>
<italic>i</italic>
</sub>. These three values for each clone are then compared to their corresponding values constructed from data <inline-formula id="inf74">
<mml:math id="m89">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, as we detail in the next section. These predictions, along with the predicted richness <italic>C</italic>
<sub>s</sub>(<italic>t</italic>) and total sampled granulocyte population <italic>S</italic>(<italic>t</italic>) provide the basis for comparing with measured data and parameter inference.</p>
</sec>
</sec>
<sec id="s3">
<title>Data analysis and results</title>
<sec id="s3-1">
<title>Data presentation</title>
<p>The published experimental data in (<xref ref-type="bibr" rid="B28">Koelle et al., 2017</xref>) provide data for four rhesus macaques ZH33, ZG66, ZH19, and ZJ31 over a period of 49, 42, 36 and 20&#xa0;months, respectively. Samples were taken after autologous transplantation with myeloablative conditioning at times <italic>t</italic>
<sub>
<italic>j</italic>
</sub>, 1 &#x2264; <italic>j</italic> &#x2264; <italic>J</italic>. Possible sampled cells are of five types: T cells, B cells, monocytes, granulocytes and NK cells. Barcoded myeloid (granulocytes and monocytes) and B-cells reach a noisy equilibrium after approximately 1&#xa0;month, whereas for T-cells the time frame is longer, between 5 to 17&#xa0;months. Furthermore, since granulocytes comprise a majority of white blood cells, we apply our mathematical and statistical model to the granulocyte lineage. At each sampling time <italic>t</italic>
<sub>
<italic>j</italic>
</sub>, the experimental data from (<xref ref-type="bibr" rid="B28">Koelle et al., 2017</xref>) reveals how many cells are sampled from each clone and what type each cell is. Across sampling time points, these sampled populations contain information on the overall abundance, how these abundances fluctuate in time, and the density of the number of clones detected as a function of abundance and abundance variability. Since ZH33 has the longest follow-up period, we use data from this macaque to compare experimental data with our mathematical predictions.</p>
</sec>
<sec id="s3-2">
<title>Matching model to data</title>
<p>Validation of our model will rely on matching predictions with available data in the form of <inline-formula id="inf75">
<mml:math id="m90">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula id="inf76">
<mml:math id="m91">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, and <inline-formula id="inf77">
<mml:math id="m92">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>. Since the model contains many parameters and the data is noisy and &#x201c;sparse,&#x201d; the model will likely overfit. Therefore, we carry out the parameter estimation by hand in stages, imposing limit on parameter values that are physiologically feasible.</p>
<p>First, we compare <italic>C</italic>
<sub>h</sub>(<italic>t</italic>) (Eq. <xref ref-type="disp-formula" rid="e6">6</xref>) with the richness <inline-formula id="inf78">
<mml:math id="m93">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> shown in <xref ref-type="fig" rid="F1">Figure 1A</xref> to provide a constraint among <italic>&#x3bc;</italic>
<sub>h</sub>, <italic>K</italic>, <italic>C</italic>
<sub>h</sub>(0), and <italic>r</italic>
<sub>h</sub>(0). We assume that the <italic>C</italic>
<sub>h</sub>(0) associated with granulocytes is slightly greater than the total richness across all samples after the first two, <inline-formula id="inf79">
<mml:math id="m94">
<mml:msub>
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">h</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2273;</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x3e;</mml:mo>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msubsup>
</mml:math>
</inline-formula>. This is equivalent to assuming that granulocyte richness after about 2&#x00A0;months arises solely from barcoded HSCs. The cumulative post-two-month richnesses <inline-formula id="inf80">
<mml:math id="m95">
<mml:msubsup>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x3e;</mml:mo>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msubsup>
</mml:math>
</inline-formula> for animals ZH33, ZG66, ZH19, and ZJ31 are 2,335, 2007, 4,007, and 30732, respectively. Although the sample specific <inline-formula id="inf81">
<mml:math id="m96">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> quickly decreases for <italic>t</italic> &#x3e; <italic>t</italic>
<sub>1</sub>, our model prediction for <italic>C</italic>
<sub>h</sub>(<italic>t</italic>) follows Eq. <xref ref-type="disp-formula" rid="e6">6</xref> and decays more slowly. By estimating <italic>C</italic>
<sub>h</sub>(0) and using Eq. <xref ref-type="disp-formula" rid="e6">6</xref>, we generate the predicted <italic>C</italic>
<sub>s</sub>(<italic>t</italic>) and <italic>S</italic>(<italic>t</italic>) by simulating our full model and comparing them to <inline-formula id="inf82">
<mml:math id="m97">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf83">
<mml:math id="m98">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>. This allows us to further constrain the parameters <italic>C</italic>
<sub>h</sub>(0), <italic>r</italic>
<sub>h</sub>(0), <italic>K</italic>, and <italic>&#x3bc;</italic>
<sub>h</sub>. Note that no analytic formula exists for <italic>C</italic>
<sub>s</sub>(<italic>t</italic>).</p>
<p>We first set <italic>K</italic> &#x2248; 100<italic>C</italic>
<sub>h</sub>(0) as the niche carrying capacity since smaller or larger values of <italic>K</italic> cannot provide the correct average clone sizes or approximately matching values of <italic>C</italic>
<sub>s</sub>. This comparison allowed us to obtain rough constraints and approximations to some parameters, particularly <italic>&#x3bc;</italic>
<sub>h</sub>, <italic>r</italic>
<sub>h</sub>(0), and <italic>C</italic>
<sub>h</sub>(0). Discrete sets of values that are consistent with <inline-formula id="inf84">
<mml:math id="m99">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> were selected and further pruned by using the remaining data.</p>
<p>The sampled richness <inline-formula id="inf85">
<mml:math id="m100">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> in ZH33 exhibits a sharp decrease after the first sample time, without a corresponding collapse in the sampled abundances of granulocytes <inline-formula id="inf86">
<mml:math id="m101">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>. Our model explains this phenomenon by the initial condition; namely, the initially transplanted population of CD34<sup>&#x2b;</sup> cells contains some partially differentiated HSPCs. Progenitor cells of barcode <italic>i</italic> (described in our model by the populations <inline-formula id="inf87">
<mml:math id="m102">
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
</mml:math>
</inline-formula>) are initially transplanted so that some <inline-formula id="inf88">
<mml:math id="m103">
<mml:msubsup>
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msubsup>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x3e;</mml:mo>
<mml:mn>0</mml:mn>
</mml:math>
</inline-formula> particularly for small <italic>&#x2113;</italic> (cells with a low degree of differentiation).</p>
<p>As shown in <xref ref-type="fig" rid="F4">Figure 4</xref>, a fraction of the initial clones are HSPCs. Once these HSPC clones generate a burst of mature cells, they disappear from the animal without being renewed since there are no corresponding HSCs carrying the same barcode. Thus, the HSPC contribution to the overall sampled richness <inline-formula id="inf89">
<mml:math id="m104">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> largely disappears after about 2&#xa0;months. However, the total mature granulocyte population <inline-formula id="inf90">
<mml:math id="m105">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> does not suffer a decline since HSPCs lost due to terminal differentiation are replaced by HSC differentiation. The subsequently sampled mature cell richness then reflects the richness <italic>C</italic>
<sub>h</sub>(0) of the initially transplanted HSCs. We propose this partial HSPC transplantation as a mechanism for the observed rapid decrease in <inline-formula id="inf91">
<mml:math id="m106">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> observed in some animals. The shape of <inline-formula id="inf92">
<mml:math id="m107">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> (see <xref ref-type="fig" rid="F7">Figure 7D</xref>) can inform our estimate of the initial progenitor population <italic>n</italic>
<sup>(<italic>&#x2113;</italic>)</sup>(<italic>t</italic> &#x3d; 0). Maxima in <inline-formula id="inf93">
<mml:math id="m108">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> can be accounted for by offspring of initially transplanted progenitor cells of different stages <italic>&#x2113;</italic>, with <italic>n</italic>
<sup>(<italic>&#x2113;</italic>)</sup>(0) generating smaller clones for larger <italic>&#x2113;</italic> (fewer remaining generations to expand).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Schematic of a mixed HSC/HSPC initial condition. The transplanted CD34<sup>&#x2b;</sup> cells contain HSCs and some progenitor cells (HSPCs), which are exhausted after about 2&#xa0;months. The remaining richness arises mainly from that of the long term HSCs <italic>C</italic>
<sub>h</sub>(0) which then slowly decreases as certain HSC clones become extinct.</p>
</caption>
<graphic xlink:href="fsysb-03-893366-g004.tif"/>
</fig>
<p>Next, we consider the small clones, predominantly arising at short times, and find their average value at the first sample taken at <italic>t</italic>
<sub>1</sub>. These small clones also yield the highest density values <inline-formula id="inf94">
<mml:math id="m109">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, but mostly disappear at longer times. Therefore, we assume they predominantly arise from initial progenitor cells. We can then generate the prediction <italic>m</italic>(<italic>t</italic> &#x3d; <italic>t</italic>
<sub>1</sub>) from our model assuming an initial condition <italic>n</italic>
<sup>
<italic>&#x2113;</italic>
</sup>(0) (and assuming no HSC contribution by setting <italic>&#x3b1;</italic> &#x3d; 0). This approximation provides a constraint on the deterministic progenitor cell parameters <italic>r</italic>
<sub>n</sub>, <italic>L</italic>, <italic>&#x3c9;</italic>, <italic>&#x3b7;</italic>. In these experiments, the typical <italic>&#x3b7;</italic> &#x223c; 10<sup>&#x2013;5</sup>, so we find that <italic>L</italic> &#x3d; 22, and collect a set of feasible values for <italic>r</italic>
<sub>n</sub>, <italic>&#x3c9;</italic>, and <italic>&#x3b7;</italic> that provide a good starting point for estimating the other parameters in the model. Note that <italic>r</italic>
<sub>n</sub>, <italic>L</italic>, <italic>&#x3c9;</italic>, <italic>&#x3b7;</italic> can largely compensate each other at this level of comparison. In other words, sets of different ranges of values of one parameter will fit equally well provided some other parameters are also correspondingly adjusted.</p>
<p>Next, we least-squares minimize <inline-formula id="inf95">
<mml:math id="m110">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>S</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, where the model prediction <italic>S</italic>(<italic>t</italic>) is given by Eq. <xref ref-type="disp-formula" rid="e15">15</xref>. This further helps fix <italic>&#x3b1;</italic>. Once a set of parameters that allow for a reasonable match of <italic>C</italic>
<sub>s</sub>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>) and <italic>S</italic>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>) have been defined, as shown in <xref ref-type="fig" rid="F5">Figures 5A, B</xref>, we then refine the fitting to the mean&#x2212;standard deviation <inline-formula id="inf96">
<mml:math id="m111">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> scatter plot shown in <xref ref-type="fig" rid="F1">Figure 1D</xref>.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>For animal ZH33, coarse fitting to the total population of tagged granulocytes <italic>S</italic>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>) <bold>(A)</bold>, and the total number of clones at each time point <italic>C</italic>
<sub>s</sub>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>) <bold>(B)</bold>. This initial rough matching was achieved using parameter values <italic>L</italic> &#x3d; 22, <italic>r</italic>
<sub>n</sub> &#x2248; 2, <italic>&#x3c9;</italic> &#x2248; 0.2, and sampling size <italic>&#x3b7;</italic> &#x3d; 10<sup>&#x2013;5</sup>.</p>
</caption>
<graphic xlink:href="fsysb-03-893366-g005.tif"/>
</fig>
<p>To compare our modeling results to the remaining experimental data (<inline-formula id="inf97">
<mml:math id="m112">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>, and <inline-formula id="inf98">
<mml:math id="m113">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>) and to fine-tune the estimates of the other parameters, the most natural intuition would be to compute the Euclidean distance (or any other relevant distance metric) between model predictions and experimental datasets and tune parameters so as to minimize this distance. However, since a number of clones go extinct in our model, the data size (for <inline-formula id="inf99">
<mml:math id="m114">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>, and <inline-formula id="inf100">
<mml:math id="m115">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>) varies in time.</p>
<p>Thus, before comparing predicted clone size distributions to measured results, we first cluster the data according to the values of <inline-formula id="inf101">
<mml:math id="m116">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> and <inline-formula id="inf102">
<mml:math id="m117">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>. Recall that <inline-formula id="inf103">
<mml:math id="m118">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2248;</mml:mo>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> (since <italic>&#x3c3;</italic> is highly correlated with <italic>s</italic>) is still determined from KDE using the raw, unclustered data <inline-formula id="inf104">
<mml:math id="m119">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>. Clustering is performed using <italic>k</italic>-means to partition the data into multiple regions (in <inline-formula id="inf105">
<mml:math id="m120">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula>- and <inline-formula id="inf106">
<mml:math id="m121">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula>-space) such that the Euclidean distance between a point and the center of its cluster is smaller than its distance to all other cluster centers. The goal is not to cluster the <inline-formula id="inf107">
<mml:math id="m122">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> points according to any real feature, but to simply reduce the dimensionality of the problem and to control the number of effective data points before applying least squares comparisons. Although there are no obvious features in the <inline-formula id="inf108">
<mml:math id="m123">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> data, <italic>k</italic>-means clustering of the distribution of points does yield an optimal number of clusters <italic>k</italic>&#x2a; <italic>via</italic> the &#x201c;elbow&#x201d; method where the curvature of the sum of square errors (distortion score) is maximal (<xref ref-type="bibr" rid="B57">Yuan and Yang, 2019</xref>). After implementing <italic>k</italic>-means clustering using the Python <italic>yellowbrick</italic> package, we find that the optimal number of clusters is typically <italic>k</italic>&#x2a; &#x2248; 50 &#xb1; 3 depending on the initial randomization and partitioning process. Subsequent results, however, are insensitive to the precise numbers of clusters used as long as <italic>k</italic>&#x2a; &#x2248; 50.</p>
<p>
<xref ref-type="fig" rid="F6">Figure 6A</xref> compares <inline-formula id="inf109">
<mml:math id="m124">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> from experiments and from our hybrid multicompartment model. <xref ref-type="fig" rid="F6">Figure 6B</xref> shows the distortion score (blue) and the convergence time (green) as a function of the number of clusters. The optimal number of clusters <italic>k</italic>&#x2a; &#x3d; 48 arises at the elbow of the distortion score curve. <xref ref-type="fig" rid="F6">Figure 6C</xref> shows the clustered data (for animal ZH33) against the clustered model predictions. The radius of each circle, <italic>w</italic>
<sub>
<italic>k</italic>
</sub>, <italic>k</italic> &#x3d; 1, &#x2026;, 53 denotes the fraction of data points (fraction of the total number of observed clones) assigned to cluster <italic>k</italic> and is thus a coarse-grained representation of the local data density.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>A total of 48 clusters are identified <italic>via</italic> <italic>k</italic>-means clustering of the data from animal ZH33. <bold>(A)</bold> The unclustered <inline-formula id="inf110">
<mml:math id="m125">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> data and model predictions for an arbitrary set of parameters. <bold>(B)</bold> The squared errors in <italic>k</italic>-means clustering or distortion score (blue) and convergence time (green) as a function of the number of clusters. The optimal value from the elbow signalling diminishing returns was found in this case to be <italic>k</italic>&#x2a; &#x3d; 48. <bold>(C)</bold> The location of the cluster centers plotted on the <inline-formula id="inf111">
<mml:math id="m126">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> plane. The radius of each circle indicates the fraction of all clones <italic>w</italic>
<sub>
<italic>k</italic>
</sub> that are associated with cluster <italic>k</italic> and is set to 2000<italic>w</italic>
<sub>
<italic>k</italic>
</sub>.</p>
</caption>
<graphic xlink:href="fsysb-03-893366-g006.tif"/>
</fig>
<p>Thus, we have clustered measured data according to <inline-formula id="inf112">
<mml:math id="m127">
<mml:mi>P</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">{</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>p</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>p</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">}</mml:mo>
</mml:mrow>
<mml:mo>&#x2261;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">{</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">}</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, where <inline-formula id="inf113">
<mml:math id="m128">
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> denotes the center values of cluster <italic>k</italic> and <inline-formula id="inf114">
<mml:math id="m129">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> is the area of the <italic>k</italic>
<sup>th</sup> cluster. For a fixed set of all model parameters, we generate predictions <inline-formula id="inf115">
<mml:math id="m130">
<mml:mi>Q</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">{</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>q</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>q</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>g</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">}</mml:mo>
</mml:mrow>
<mml:mo>&#x2261;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">{</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">}</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> (in this expression and in the following, <italic>&#x2113;</italic>, <italic>&#x2113;</italic>&#x2a; denote matrix indices and not progenitor cell generations). The optimal number of clusters derived from our hybrid stochastic-deterministic model, <italic>&#x2113;</italic>&#x2a; will in general be different from the number of clusters <italic>k</italic>&#x2a; derived from data, but is typically also about <italic>&#x2113;</italic>&#x2a; &#x2248; 50.</p>
<p>In order to compare the clustered data <italic>P</italic> to the model prediction <italic>Q</italic>, which are matrices with different numbers of rows, we use the Wasserstein metric, or Earth mover&#x2019;s distance (EMD) (<xref ref-type="bibr" rid="B51">Villani, 2009</xref>; <xref ref-type="bibr" rid="B29">Kolouri et al., 2017</xref>) to define a distance between them. Let <italic>d</italic>
<sub>
<italic>k</italic>,<italic>&#x2113;</italic>
</sub> denote the distance between cluster <italic>p</italic>
<sub>
<italic>k</italic>
</sub> and cluster <italic>q</italic>
<sub>
<italic>&#x2113;</italic>
</sub> so that the matrix a <bold>d</bold> &#x3d; {<italic>d</italic>
<sub>
<italic>k</italic>,<italic>&#x2113;</italic>
</sub>} catalogues all possible cluster-cluster distances. We aim to compute a flow map <bold>f</bold> &#x3d; {<italic>f</italic>
<sub>
<italic>k</italic>,<italic>&#x2113;</italic>
</sub>} that yields the minimal distance between clusters <bold>p</bold> &#x3d; {<italic>p</italic>
<sub>
<italic>k</italic>
</sub>} and clusters <bold>q</bold> &#x3d; {<italic>q</italic>
<sub>
<italic>&#x2113;</italic>
</sub>} by finding<disp-formula id="e16">
<mml:math id="m131">
<mml:msub>
<mml:mrow>
<mml:mtext>min</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="bold">f</mml:mi>
</mml:mrow>
</mml:msub>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:munderover>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:munderover>
<mml:msub>
<mml:mrow>
<mml:mi>f</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:msub>
<mml:mrow>
<mml:mi>d</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
<label>(16)</label>
</disp-formula>
</p>
<p>Subject to the constraints<disp-formula id="e17">
<mml:math id="m132">
<mml:msub>
<mml:mrow>
<mml:mi>f</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2265;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:mspace width="2em"/>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:munderover>
<mml:msub>
<mml:mrow>
<mml:mi>f</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2264;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mspace width="2em"/>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:munderover>
<mml:msub>
<mml:mrow>
<mml:mi>f</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2264;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
</mml:math>
<label>(17)</label>
</disp-formula>
</p>
<p>For all 1 &#x2264; <italic>k</italic> &#x2264; <italic>k</italic>&#x2a; and 1 &#x2264; <italic>&#x2113;</italic> &#x2264; <italic>&#x2113;</italic>&#x2a; and<disp-formula id="e18">
<mml:math id="m133">
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:munderover>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:munderover>
<mml:msub>
<mml:mrow>
<mml:mi>f</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:munderover>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:munderover>
<mml:msub>
<mml:mrow>
<mml:mi>w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>.</mml:mo>
</mml:math>
<label>(18)</label>
</disp-formula>
</p>
<p>After finding the optimal flow <bold>f</bold>, we evaluate the EMD as<disp-formula id="e19">
<mml:math id="m134">
<mml:mi mathvariant="normal">E</mml:mi>
<mml:mi mathvariant="normal">M</mml:mi>
<mml:mi mathvariant="normal">D</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>Q</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:munderover>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:munderover>
<mml:msub>
<mml:mrow>
<mml:mi>f</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:msub>
<mml:mrow>
<mml:mi>d</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>k</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:munderover>
<mml:munderover accentunder="false" accent="true">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:munderover>
<mml:msub>
<mml:mrow>
<mml:mi>f</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mi>&#x2113;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2032;</mml:mo>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:mo>.</mml:mo>
</mml:math>
<label>(19)</label>
</disp-formula>
</p>
<p>Model parameters are varied until our model-derived predictions best match the clustered data by minimizing the EMD. In this paper, we consider only the granulocyte lineage since it is the most abundant and reliably measured with minimal complex dynamics and regulation.</p>
<p>Finally, note the fluctuations in <italic>S</italic>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>) which are too large to be captured by the intrinsic stochasticity in our model, as indicated in <xref ref-type="fig" rid="F5">Figure 5B</xref>. These &#x201c;unknown&#x201d; fluctuations can arise from a number of processes, including variable sampling fractions <italic>&#x3b7;</italic>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>) at each time point <italic>t</italic>
<sub>
<italic>j</italic>
</sub> and fluctuating animal state due to infections, stress, inflammation, etc. These may influence total mature cell populations month to month. Some of these effects can be effectively accounted for by adjusting the mean sample fraction <italic>&#x3b7;</italic> &#x3d; 10<sup>&#x2013;5</sup> by an amount &#x394;<italic>&#x3b7;</italic>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>) at each time point. Using these values of &#x394;<italic>&#x3b7;</italic>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>) to match the data <italic>S</italic>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>), and then readjusting the parameters, we find good comparison between the experimental measurements and our model, as shown in <xref ref-type="fig" rid="F7">Figures 7A&#x2013;C</xref>.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Fitting of tagged granulocyte populations for animal ZH33 after time-dependent adjustment of sampling size <italic>&#x3b7;</italic>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>). For this animal <italic>t</italic>
<sub>
<italic>j</italic>
</sub> &#x3d; [1, 2, 3, 4.5, 6.5, 9.5, 12, 14, 21, 28, 30, 38, 43, 46, 49] months. <bold>(A)</bold> By initially best-matching <italic>S</italic>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>), we find <italic>&#x3b7;</italic>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>) &#x3d; [1, 2.03, 1.07, 0.94, 0.68, 1.25, 0.61, 0.83, 1.29, 1.29, 1.01, 1.01, 0.99, 1.14, 0.83]&#xd7;10<sup>&#x2013;5</sup>. <bold>(B&#x2013;D)</bold> By searching parameter space to find a good match to <inline-formula id="inf116">
<mml:math id="m135">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>, and <inline-formula id="inf117">
<mml:math id="m136">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> (which is shown with its maximum nnormalized to one), which is plotted with its maximum normalized to unity. We find parameters [in units of/day] that fit the data are <italic>&#x3bc;</italic>
<sub>h</sub> &#x3d; 0.02, <italic>r</italic>
<sub>h</sub>(0) &#x3d; 0.08, <italic>C</italic>
<sub>h</sub>(0) &#x3d; 2500, <italic>C</italic>
<sub>n</sub>(<italic>&#x2113;</italic> &#x3d; 0) &#x3d; 800, <italic>C</italic>
<sub>n</sub>(<italic>&#x2113;</italic> &#x3d; 1) &#x3d; 1600, <italic>C</italic>
<sub>n</sub>(<italic>&#x2113;</italic> &#x3d; 2) &#x3d; 3200, <italic>K</italic> &#x3d; 2.5&#xd7;10<sup>5</sup>, <italic>&#x3b1;</italic> &#x3d; 0.016, <italic>r</italic>
<sub>n</sub> &#x3d; 2, <italic>L</italic> &#x3d; 22, <italic>&#x3bc;</italic>
<sub>n</sub> &#x3d; 0, <italic>&#x3bc;</italic>
<sub>m</sub> &#x3d; 0.185 and <italic>&#x3c9;</italic> &#x3d; 0.2.</p>
</caption>
<graphic xlink:href="fsysb-03-893366-g007.tif"/>
</fig>
<p>To further show consistency, we then plotted the predicted density and compare it with the data-derived (using KDE) density <inline-formula id="inf118">
<mml:math id="m137">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> in <xref ref-type="fig" rid="F7">Figure 7D</xref>. A few large, highly variable clones remain not well reproduced by our model and are discussed in the next section. The parameter estimation procedure was applied to the three other animals in (<xref ref-type="bibr" rid="B28">Koelle et al., 2017</xref>), showing reasonable, consistent matching (see <xref ref-type="sec" rid="s10">Supplementary Material</xref>).</p>
</sec>
</sec>
<sec id="s4">
<title>Discussion and conclusion</title>
<p>In this paper, we analyzed data from stem cell transplantation experiments in rhesus macaque (<xref ref-type="bibr" rid="B28">Koelle et al., 2017</xref>) in which barcoded stem and progenitor cells (HSPCs) were autologously transplanted after myeloablative conditioning. Typically, of the <inline-formula id="inf119">
<mml:math id="m138">
<mml:mo>&#x223c;</mml:mo>
<mml:mn>30</mml:mn>
</mml:math>
</inline-formula> million cells transplanted only <inline-formula id="inf120">
<mml:math id="m139">
<mml:mo>&#x223c;</mml:mo>
<mml:mn>15</mml:mn>
<mml:mo>&#x2013;</mml:mo>
<mml:mn>35</mml:mn>
<mml:mi>%</mml:mi>
</mml:math>
</inline-formula> are tagged and then only a fraction homes to functional bone marrow niches. Nonetheless, typically hundreds or thousands of barcodes are detected in peripheral blood samples. The counts of circulating mature cells derived from each clone fluctuate from sample to sample; these fluctuations are significantly larger than those expected from random small samples (<xref ref-type="bibr" rid="B55">Xu et al., 2018</xref>) and thus arise from intrinsic stochasticity (<xref ref-type="bibr" rid="B2">Abkowitz et al., 1996</xref>) during hematopoiesis and/or physiological changes in the animals over the months that samples were being drawn.</p>
<p>In order to explain clone size variability, we extend a mathematical model first presented in (<xref ref-type="bibr" rid="B55">Xu et al., 2018</xref>). Our hybrid stochastic-deterministic model delineates all the clone populations and assumes regulation of the stem cell proliferation rate through a carrying capacity <italic>K</italic>, a finite differentiation potential of progenitor cells, terminal differentiation after a fixed number of divisions, and a final sampling step. Since the numbers of HSCs within each clone are typically small, we treated the self-renewal of HSCs within its niche stochastically by a coupled (through the carrying capacity) discrete birth-death process for each clone. In (<xref ref-type="bibr" rid="B55">Xu et al., 2018</xref>), the coupling in the stochastic HSC birth-death process was treated using a mean field approximation, which leads to a smaller clone size variability, everything else equal. Random times of asymmetric differentiation of each HSC into the first-stage progenitor cell is described by a rate <italic>&#x3b1;</italic>. After <italic>L</italic> differentiation steps, the <italic>L</italic>
<sup>th</sup>-stage progenitor cell terminally differentiates into a mature, circulating blood cell. The progenitor and mature cell pools are treated deterministically. We performed stochastic simulations using the Gillespie algorithm (<xref ref-type="bibr" rid="B5">Bortz et al., 1975</xref>; <xref ref-type="bibr" rid="B21">Gillespie, 2007</xref>) of the entire HSC pool and solve for the progenitor and mature cell populations numerically. Additional feedback mechanisms between the HSC and progenitor pools can be implemented (<xref ref-type="bibr" rid="B27">Klose et al., 2019</xref>), but in our case would require a more complex model incorporating two-way coupling between stochastic and deterministic dynamics.</p>
<p>Our model suggests that the sampled clone abundance variation arises primarily from random differentiation events by HSC clones that occur at rate <italic>&#x3b1;</italic>. Each differentiation event leads to a temporal burst of mature cells of the same clone. We hypothesize that these bursts of mature cell production lead to the variability in sampled clone populations. Other physiological factors related to animal state may still also play a role, but are not considered in our model. Another feature captured by our current model is the transient richness immediately after transplantation. This behavior is explained by our initial condition that contains short-term HSPCs that are within the initial CD34<sup>&#x2b;</sup> pool. These HSPCs quickly differentiate but are not replenished at long times. This distributed initial condition may depend on the experimental protocol and may be indicative of the efficiency, and especially, the composition of the transplant.</p>
<p>Our model also allows us to explore how clone abundance predictions change with parameters. For example, we find that the range of larger clone sizes increase with increases in <italic>L</italic>, <italic>K</italic>, and <italic>&#x3b1;</italic>, in this order. All parameters affect the density of predicted data and cluster sizes. Mature cell death rates, which vary across different cell types, also affect the predicted abundance variations, especially for larger values of <italic>&#x3bc;</italic>
<sub>m</sub>.</p>
<p>We also note that while percentage of GFP&#x2b; cells within each mature cell type (lineage) fluctuated from sample to sample, they generally increased with animal age (after transplant) for all animals. T cells had the largest increase in their barcoded populations during the handful of months after transplantation. Since this timescale is much longer than the progenitor cell transients, this slow increase in tagged cell populations suggests that, assuming a neutral model (barcodes and barcode integration sites do not affect cell proliferation and death rates), (i) that a certain fraction of HSCs remained <italic>in situ</italic> after radiative ablation, and (ii) the CD34<sup>&#x2b;</sup> barcoded and transplanted HSC population with an enriched GFP&#x2b; fraction were slowly activated. Scenario (i) means that some HSCs remained in their niche and continuously generated blood. The transplanted cells with barcoded HSCs (GFP&#x2b;) can increase in importance if they slowly become more proliferative as they settle into the animal. Thus, the slow increase in GFP&#x2b; fraction in all five measured lineages suggest that transplanted cells may recover slowly from the transplantation procedure and increase their contribution to mature blood cell formation.</p>
<p>Finally, we note that there appears to be additional fluctuation mechanisms that are not accounted for in our model. In all animals, there appears to be a few very large clones with very high variability <inline-formula id="inf121">
<mml:math id="m140">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>. Within a stochastic HSC population, adjusting birth-death parameters that allow for larger clones and larger variances would suppress the richness to below what is observed. We have extensively explored feasible regimes of all parameters and conclude that allowing large clones that vary in abundance precludes agreement with other basic observables such as <inline-formula id="inf122">
<mml:math id="m141">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf123">
<mml:math id="m142">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>. Nonetheless, such unexplained features can be mechanistically informative and we discuss a number of reasonable factors that may account for them. First, the fluctuations in the measured total abundances of the different mature cell lineages did not correlate, implying that the specific set of sampling sizes <italic>&#x3b7;</italic>(<italic>t</italic>
<sub>
<italic>j</italic>
</sub>) used to explain granulocyte population variations (as shown in <xref ref-type="fig" rid="F7">Figure 7</xref>) cannot be used to analyze those of other mature cell lineages. The seemingly uncorrelated cross-lineage populations imply that time variations in animal state arise further downstream, affecting the development of individual lineages. If fluctuations occurred in stem or multipotent progenitor cells, they would affect multiple cell lineages in similar ways and lead to inter-lineage population correlations.</p>
<p>Animal ZJ31 (see <xref ref-type="sec" rid="s10">Supplementary Material</xref>) appears to be uniquely different from the others in that it exhibited a much larger richness <inline-formula id="inf124">
<mml:math id="m143">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> as well as a much smaller maximum clone size (which non-etheless had high variance <inline-formula id="inf125">
<mml:math id="m144">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>&#x3c3;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula>). For example, <italic>C</italic>
<sub>s</sub> at <italic>t</italic>
<sub>
<italic>j</italic>
</sub> &#x3d; 5 months dips to a very low value, while the abundance <inline-formula id="inf126">
<mml:math id="m145">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> seems to be at a local maximum. Thus, a small number of granulocyte clones expanded dramatically, potentially squeezing out the many smaller clones below sampling. At month seven, <inline-formula id="inf127">
<mml:math id="m146">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> is extremely low but <inline-formula id="inf128">
<mml:math id="m147">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> has recovered to its long term value, indicating that the previously large granulocyte clones were quickly cleared out. The results for ZJ31 may indicate a lower level of competitive exclusion, but also some other mechanism contributing to high variability. Therefore, the overall observation of high variability and the magnitudes of <inline-formula id="inf129">
<mml:math id="m148">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">s</mml:mi>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> indicates that other model features should be considered.</p>
<p>One assumption of our model that is likely an oversimplification is the neutrality of barcodes. Although different barcodes themselves may not influence cells, different VISs may. For example, aberrant self-renewal arises when using lentiviral vectors (<xref ref-type="bibr" rid="B18">Espinoza et al., 2019</xref>) and different VISs of HIV have been shown to affect cellular proliferation rates (<italic>e.g.</italic>, if the VIS is near an oncogene) <xref ref-type="bibr" rid="B56">Yeh et al. (2021)</xref>. Besides the non-neutrality, we have also neglected stochastic or variable proliferative potential <italic>L</italic> and the time course of the HSC homing and engraftment into the bone marrow. A random but distributed <italic>L</italic> would allow a few randomly selected clones to expand further. We also expect that HSC migration and successful settlement into the bone marrow niche is a time-continuous process that provide a proliferation head start for a few early arriving clones. This would ultimately result in fewer clones <italic>C</italic>
<sub>s</sub> with some of them at higher populations <italic>s</italic>
<sub>
<italic>i</italic>
</sub>(<italic>t</italic>). An instantaneous (more abrupt) HSC engraftment and a larger spread in <italic>L</italic> would be more consistent with animal ZJ31 than with the others.</p>
<p>Additional information can be extracted from the clone abundance data to further identify and interrogate such &#x201c;opposing&#x201d; behaviors. For example, we have only considered the average autocorrelation of the clone abundances (the variance) and have not constructed cross-correlations between cell types/lineages or correlations across time. Except for the initial period after transplantation, we have assumed a time-inhomogeneous process and have not considered explicit time-dependence such as aging (<xref ref-type="bibr" rid="B37">Muller-Sieburg et al., 2012</xref>; <xref ref-type="bibr" rid="B15">de Haan and Lazare, 2018</xref>). Physiological aging can be straightforwardly incorporated by <italic>e.g.,</italic> allowing for slow degradation of HSCs, changes in progenitor proliferative potential (<xref ref-type="bibr" rid="B34">Marciniak-Czochra et al., 2009</xref>), or changes in HSC niche carrying capacity <italic>K</italic>(<italic>t</italic>). Mutations that arise with age may also <italic>increase</italic> HSC self-renewal (<xref ref-type="bibr" rid="B9">Challen and Goodell, 2020</xref>) which could be modeled by a <italic>r</italic>
<sub>h</sub>(0) that increases with time. Thymic interruptions or involution with age (<xref ref-type="bibr" rid="B31">Lewkiewicz et al., 2019a</xref>,<xref ref-type="bibr" rid="B32">b</xref>) could also be modeled by assuming a decreasing maturation rate <italic>&#x3c9;</italic>(<italic>t</italic>) when considering the T cell lineage.</p>
<p>While our current model contains a large number of parameters, it seems that a number of them are compensatory and control specific properties of the model predictions. For example, we found that <italic>&#x3b1;</italic>, <italic>L</italic>, <italic>&#x3c9;</italic>, and <italic>&#x3b7;</italic> can compensate for each other and form an unknown effective parameter function <italic>f</italic>(<italic>&#x3b1;</italic>, <italic>L</italic>, <italic>&#x3c9;</italic>, <italic>&#x3b7;</italic>). This feature effectively reduces overfitting and might be better analyzed using machine learning methods. Incorporating the more realistic mechanisms discussed above would yield additional effective parameters allowing the model to more accurately reproduce the measured quantities; nonetheless, intermittent differentiation of HSCs remains the key proposed mechanism for understanding intersample clone abundance variations.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>Publicly available datasets were analyzed in this study. This data can be found here: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1182/blood-2016-07-728691">https://doi.org/10.1182/blood-2016-07-728691</ext-link>.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>TC, YP, and MD&#x2019;O developed and analyzed the model and wrote the manuscript. YP organized the data, performed numerical analyses, and data fitting. MT contributed to the analysis of the model and helped shape the stochastic simulation approach. TS provided insight on stem cell biology.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>This work was supported by grants from the NIH through grant R01HL146552 (TC) and the Army Research Office through grant W911NF-18-1-0345 (MD&#x2019;O) and DMS-1814090 (MD&#x2019;O).</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fsysb.2023.893366/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fsysb.2023.893366/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet1.pdf" id="SM1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<fn-group>
<fn id="fn1">
<label>1</label>
<p>Certain lineages such as T cells can intermittently proliferate, e.g., upon antigen activation, but we neglect this and use small effective death rates <italic>&#x3bc;</italic>
<sub>m</sub> for such cell types.</p>
</fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abbuehl</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Tatarova</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Held</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Huelsken</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Long-term engraftment of primary bone marrow stromal cells repairs niche damage and improves hematopoietic stem cell transplantation</article-title>. <source>Cell. Stem Cell.</source> <volume>21</volume>, <fpage>241</fpage>&#x2013;<lpage>255</lpage>. <pub-id pub-id-type="doi">10.1016/j.stem.2017.07.004</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abkowitz</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Catlin</surname>
<given-names>S. N.</given-names>
</name>
<name>
<surname>Guttorp</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>Evidence that hematopoiesis may be a stochastic process <italic>in vivo</italic>
</article-title>. <source>Nat. Med.</source> <volume>2</volume>, <fpage>190</fpage>&#x2013;<lpage>197</lpage>. <pub-id pub-id-type="doi">10.1038/nm0296-190</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Attar</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Changes in the cell surface markers during normal hematopoiesis: A guide to cell isolation</article-title>. <source>Glob. J. Hematol. Blood Transfus.</source> <volume>1</volume>, <fpage>20</fpage>&#x2013;<lpage>28</lpage>. <pub-id pub-id-type="doi">10.15379/2408-9877.2014.01.01.4</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Biasco</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Pellin</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Scala</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Dionisio</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Basso-Ricci</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Leonardelli</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>
<italic>In vivo</italic> tracking of human hematopoiesis reveals patterns of clonal dynamics during early and steady-state reconstitution phases</article-title>. <source>Cell. Stem Cell.</source> <volume>19</volume>, <fpage>107</fpage>&#x2013;<lpage>119</lpage>. <pub-id pub-id-type="doi">10.1016/j.stem.2016.04.016</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bortz</surname>
<given-names>A. B.</given-names>
</name>
<name>
<surname>Kalos</surname>
<given-names>M. H.</given-names>
</name>
<name>
<surname>Lebowitz</surname>
<given-names>J. L.</given-names>
</name>
</person-group> (<year>1975</year>). <article-title>A new algorithm for Monte Carlo simulation of ising spin systems</article-title>. <source>J. Comput. Phys.</source> <volume>17</volume>, <fpage>10</fpage>&#x2013;<lpage>18</lpage>. <pub-id pub-id-type="doi">10.1016/0021-9991(75)90060-1</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Busch</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Klapproth</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Barile</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Flossdorf</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Holland-Letz</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Schlenner</surname>
<given-names>S. M.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Fundamental properties of unperturbed haematopoiesis from stem cells <italic>in vivo</italic>
</article-title>. <source>Nature</source> <volume>518</volume>, <fpage>542</fpage>&#x2013;<lpage>546</lpage>. <pub-id pub-id-type="doi">10.1038/nature14242</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bystrykh</surname>
<given-names>L. V.</given-names>
</name>
<name>
<surname>Verovskaya</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Zwart</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Broekhuis</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>de Haan</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Counting stem cells: Methodological constraints</article-title>. <source>Nat. Methods</source> <volume>9</volume>, <fpage>567</fpage>&#x2013;<lpage>574</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.2043</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Catlin</surname>
<given-names>S. N.</given-names>
</name>
<name>
<surname>Busque</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Gale</surname>
<given-names>R. E.</given-names>
</name>
<name>
<surname>Guttorp</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Abkowitz</surname>
<given-names>J. L.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>The replication rate of human hematopoietic stem cells <italic>in vivo</italic>
</article-title>. <source>Blood</source> <volume>117</volume>, <fpage>4460</fpage>&#x2013;<lpage>4466</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2010-08-303537</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Challen</surname>
<given-names>G. A.</given-names>
</name>
<name>
<surname>Goodell</surname>
<given-names>M. A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Clonal hematopoiesis: Mechanisms driving dominance of stem cell clones</article-title>. <source>Blood</source> <volume>136</volume>, <fpage>1590</fpage>&#x2013;<lpage>1598</lpage>. <pub-id pub-id-type="doi">10.1182/blood.2020006510</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chao</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>C. W.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Nonparametric lower bounds for species richness and shared species richness under sampling without replacement</article-title>. <source>Biometrics</source> <volume>68</volume>, <fpage>912</fpage>&#x2013;<lpage>921</lpage>. <pub-id pub-id-type="doi">10.1111/j.1541-0420.2011.01739.x</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Colijn</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Mackey</surname>
<given-names>M. C.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>A mathematical model of hematopoiesis: II. Cyclical neutropenia</article-title>. <source>J. Theor. Biol.</source> <volume>237</volume>, <fpage>133</fpage>&#x2013;<lpage>146</lpage>. <pub-id pub-id-type="doi">10.1016/j.jtbi.2005.03.034</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Copley</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Beer</surname>
<given-names>P. A.</given-names>
</name>
<name>
<surname>Eaves</surname>
<given-names>C. J.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Hematopoietic stem cell heterogeneity takes center stage</article-title>. <source>Cell. Stem Cell.</source> <volume>10</volume>, <fpage>690</fpage>&#x2013;<lpage>697</lpage>. <pub-id pub-id-type="doi">10.1016/j.stem.2012.05.006</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cordes</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Dunbar</surname>
<given-names>C. E.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Clonal tracking of haematopoietic cells: Insights and clinical implications</article-title>. <source>J. Haematol.</source> <volume>192</volume>, <fpage>819</fpage>&#x2013;<lpage>831</lpage>. <pub-id pub-id-type="doi">10.1111/bjh.17175</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Corso</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Varettoni</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mangiacavalli</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zappasodi</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Klersy</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Rusconi</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2005</year>). <article-title>Bone marrow CD34&#x2b; cell count is predictive for adequate peripheral progenitor cell collection</article-title>. <source>Leukemia Res.</source> <volume>29</volume>, <fpage>159</fpage>&#x2013;<lpage>163</lpage>. <pub-id pub-id-type="doi">10.1016/j.leukres.2004.05.018</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>de Haan</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Lazare</surname>
<given-names>S. S.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Aging of hematopoietic stem cells</article-title>. <source>Blood</source> <volume>131</volume>, <fpage>479</fpage>&#x2013;<lpage>487</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2017-06-746412</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>De Souza</surname>
<given-names>D. C.</given-names>
</name>
<name>
<surname>Humphries</surname>
<given-names>A. R.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Dynamics of a mathematical hematopoietic stem-cell population model</article-title>. <source>SIAM J. Appl. Dyn. Syst.</source> <volume>18</volume>, <fpage>808</fpage>&#x2013;<lpage>852</lpage>. <pub-id pub-id-type="doi">10.1137/18m1165086</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Doulatov</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Notta</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Laurenti</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Dick</surname>
<given-names>J. E.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Hematopoiesis: A human perspective</article-title>. <source>Cell. Stem Cell.</source> <volume>10</volume>, <fpage>120</fpage>&#x2013;<lpage>136</lpage>. <pub-id pub-id-type="doi">10.1016/j.stem.2012.01.006</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Espinoza</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Cordes</surname>
<given-names>S. F.</given-names>
</name>
<name>
<surname>Truitt</surname>
<given-names>L. L.</given-names>
</name>
<name>
<surname>Calvo</surname>
<given-names>K. R.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Aberrant clonal hematopoiesis following lentiviral vector transduction of HSPCs in a rhesus macaque</article-title>. <source>Mol. Ther.</source> <volume>27</volume>, <fpage>1074</fpage>&#x2013;<lpage>1086</lpage>. <pub-id pub-id-type="doi">10.1016/j.ymthe.2019.04.003</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fliedner</surname>
<given-names>M. C.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Research within the field of blood and marrow transplantation nursing: How can it contribute to higher quality of care?</article-title> <source>Int. J. Hematol.</source> <volume>76</volume>, <fpage>289</fpage>&#x2013;<lpage>291</lpage>. <pub-id pub-id-type="doi">10.1007/BF03165135</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gillespie</surname>
<given-names>D. T.</given-names>
</name>
</person-group> (<year>1977</year>). <article-title>Exact stochastic simulation of coupled chemical reactions</article-title>. <source>J. Phys. Chem.</source> <volume>81</volume>, <fpage>2340</fpage>&#x2013;<lpage>2361</lpage>. <pub-id pub-id-type="doi">10.1021/j100540a008</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gillespie</surname>
<given-names>D. T.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Stochastic simulation of chemical kinetics</article-title>. <source>Annu. Rev. Phys. Chem.</source> <volume>58</volume>, <fpage>35</fpage>&#x2013;<lpage>55</lpage>. <pub-id pub-id-type="doi">10.1146/annurev.physchem.58.032806.104637</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goyal</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>I. S.</given-names>
</name>
<name>
<surname>Chou</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Mechanisms of blood homeostasis: Lineage tracking and a neutral model of cell populations in rhesus macaques</article-title>. <source>BMC Biol.</source> <volume>13</volume>, <fpage>85</fpage>. <pub-id pub-id-type="doi">10.1186/s12915-015-0191-8</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grosselin</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sii-Felice</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Payen</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Chretien</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Roux</surname>
<given-names>D. T. L.</given-names>
</name>
<name>
<surname>Leboulch</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Arrayed lentiviral barcoding for quantification analysis of hematopoietic dynamics</article-title>. <source>Stem Cells</source> <volume>31</volume>, <fpage>2162</fpage>&#x2013;<lpage>2171</lpage>. <pub-id pub-id-type="doi">10.1002/stem.1383</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>H&#xf6;fer</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Rodewald</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Output without input: The lifelong productivity of hematopoietic stem cells</article-title>. <source>Curr. Opin. Cell. Biol.</source> <volume>43</volume>, <fpage>69</fpage>&#x2013;<lpage>77</lpage>. <pub-id pub-id-type="doi">10.1016/j.ceb.2016.08.003</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Presson</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Metzger</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bonifacino</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sehl</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Dynamics of HSPC repopulation in nonhuman primates revealed by a decade-long clonal-tracking study</article-title>. <source>Cell. Stem Cell.</source> <volume>14</volume>, <fpage>473</fpage>&#x2013;<lpage>485</lpage>. <pub-id pub-id-type="doi">10.1016/j.stem.2013.12.012</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Presson</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>An</surname>
<given-names>D. S.</given-names>
</name>
<name>
<surname>Mao</surname>
<given-names>S. H.</given-names>
</name>
<name>
<surname>Bonifacino</surname>
<given-names>A. C.</given-names>
</name>
<etal/>
</person-group> (<year>2010</year>). <article-title>High-throughput, sensitive quantification of repopulating hematopoietic stem cell clones</article-title>. <source>J. Virology</source> <volume>84</volume>, <fpage>11771</fpage>&#x2013;<lpage>11780</lpage>. <pub-id pub-id-type="doi">10.1128/JVI.01355-10</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Klose</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Florian</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Gerbaulet</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Geiger</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Glauche</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Hematopoietic stem cell dynamics are regulated by progenitor demand: Lessons from a quantitative modeling approach</article-title>. <source>Stem Cells</source> <volume>37</volume>, <fpage>948</fpage>&#x2013;<lpage>957</lpage>. <pub-id pub-id-type="doi">10.1002/stem.3005</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Koelle</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Espinoza</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>B.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Quantitative stability of hematopoietic stem and progenitor cell clonal output in rhesus macaques receiving transplants</article-title>. <source>Blood</source> <volume>129</volume>, <fpage>1448</fpage>&#x2013;<lpage>1457</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2016-07-728691</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kolouri</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Thorpe</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Slepcev</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Rohde</surname>
<given-names>G. K.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Optimal mass transport: Signal processing and machine-learning applications</article-title>. <source>IEEE Signal Process. Mag.</source> <volume>34</volume>, <fpage>43</fpage>&#x2013;<lpage>59</lpage>. <pub-id pub-id-type="doi">10.1109/MSP.2017.2695801</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee-Six</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Friesgaard-Obro</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Shepherd</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Grossmann</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Dawson</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Belmonte</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Population dynamics of normal human blood inferred from somatic mutations</article-title>. <source>Nature</source> <volume>561</volume>, <fpage>473</fpage>&#x2013;<lpage>478</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-018-0497-0</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lewkiewicz</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Chuang</surname>
<given-names>Y. L.</given-names>
</name>
<name>
<surname>Chou</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2019a</year>). <article-title>A mathematical model of the effects of aging on naive T cell populations and diversity</article-title>. <source>Bull. Math. Biol.</source> <volume>81</volume>, <fpage>2783</fpage>&#x2013;<lpage>2817</lpage>. <pub-id pub-id-type="doi">10.1007/s11538-019-00630-z</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lewkiewicz</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Chuang</surname>
<given-names>Y. L.</given-names>
</name>
<name>
<surname>Chou</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2019b</year>). <article-title>Dynamics of T cell receptor distributions following acute thymic atrophy and resumption</article-title>. <source>Math. Biosci. Eng.</source> <volume>17</volume>, <fpage>28</fpage>&#x2013;<lpage>55</lpage>. <pub-id pub-id-type="doi">10.3934/mbe.2020002</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lyne</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Kent</surname>
<given-names>D. G.</given-names>
</name>
<name>
<surname>Laurenti</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Cornils</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Glauche</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Perie</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>A track of the clones: New developments in cellular barcoding</article-title>. <source>Exp. Hematol.</source> <volume>68</volume>, <fpage>15</fpage>&#x2013;<lpage>20</lpage>. <pub-id pub-id-type="doi">10.1016/j.exphem.2018.11.005</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marciniak-Czochra</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Stiehl</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wagner</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Modeling of replicative senescence in hematopoietic development</article-title>. <source>Aging (Albany NY)</source> <volume>1</volume>, <fpage>723</fpage>&#x2013;<lpage>732</lpage>. <pub-id pub-id-type="doi">10.18632/aging.100072</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mayle</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Jeong</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Goodell</surname>
<given-names>M. A.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Flow cytometry analysis of murine hematopoietic stem cells</article-title>. <source>Nature</source> <volume>518</volume>, <fpage>542</fpage>&#x2013;<lpage>546</lpage>.</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mendelson</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Frenette</surname>
<given-names>P. S.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Hematopoietic stem cell niche maintenance during homeostasis and regeneration</article-title>. <source>Nat. Med.</source> <volume>20</volume>, <fpage>833</fpage>&#x2013;<lpage>846</lpage>. <pub-id pub-id-type="doi">10.1038/nm.3647</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Muller-Sieburg</surname>
<given-names>C. E.</given-names>
</name>
<name>
<surname>Sieburg</surname>
<given-names>H. B.</given-names>
</name>
<name>
<surname>Bernitz</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Cattarossi</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Stem cell heterogeneity: Implications for aging and regenerative medicine</article-title>. <source>Blood</source> <volume>119</volume>, <fpage>3900</fpage>&#x2013;<lpage>3907</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2011-12-376749</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Parmentier</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kramer</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Weller</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Schuler</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Ordemann</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Rall</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Reevaluation of reference values for bone marrow differential counts in 236 healthy bone marrow donors</article-title>. <source>Ann. Hematol.</source> <volume>99</volume>, <fpage>2723</fpage>&#x2013;<lpage>2729</lpage>. <pub-id pub-id-type="doi">10.1007/s00277-020-04255-4</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Parzen</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>1962</year>). <article-title>On estimation of a probability density function and mode</article-title>. <source>Ann. Math. Statistics</source> <volume>33</volume>, <fpage>1065</fpage>&#x2013;<lpage>1076</lpage>. <pub-id pub-id-type="doi">10.1214/aoms/1177704472</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peixoto</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Dingli</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Pacheco</surname>
<given-names>J. M.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Modelling hematopoiesis in health and disease</article-title>. <source>Math. Comput. Model.</source> <volume>53</volume>, <fpage>1546</fpage>&#x2013;<lpage>1557</lpage>. <pub-id pub-id-type="doi">10.1016/j.mcm.2010.04.013</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Radtke</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Colonna</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Perez</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Hoffman</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kean</surname>
<given-names>L. S.</given-names>
</name>
<name>
<surname>Kiem</surname>
<given-names>H. P.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Isolation of a highly purified HSC-enriched CD34<sup>&#x002B;</sup>CD90<sup>&#x002B;</sup>CD45RA<sup>&#x2212;</sup> cell subset for allogeneic transplantation in the nonhuman primate large-animal model</article-title>. <source>Transplant. Direct</source> <volume>6</volume>, <fpage>e579</fpage>. <pub-id pub-id-type="doi">10.1097/TXD.0000000000001029</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rosenblatt</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>1956</year>). <article-title>Remarks on some nonparametric estimates of a density function</article-title>. <source>Ann. Math. Statistics</source> <volume>27</volume>, <fpage>832</fpage>&#x2013;<lpage>837</lpage>. <pub-id pub-id-type="doi">10.1214/aoms/1177728190</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Seita</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Weissman</surname>
<given-names>I. L.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Hematopoietic stem cell: Self-renewal versus differentiation</article-title>. <source>Wiley Interdiscip. Rev. Syst. Biol. Med.</source> <volume>2</volume>, <fpage>640</fpage>&#x2013;<lpage>653</lpage>. <pub-id pub-id-type="doi">10.1002/wsbm.86</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shepherd</surname>
<given-names>B. E.</given-names>
</name>
<name>
<surname>Kiem</surname>
<given-names>H. P.</given-names>
</name>
<name>
<surname>Lansdorp</surname>
<given-names>P. M.</given-names>
</name>
<name>
<surname>Dunbar</surname>
<given-names>C. E.</given-names>
</name>
<name>
<surname>Aubert</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>LaRochelle</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2007</year>). <article-title>Hematopoietic stem-cell behavior in nonhuman primates</article-title>. <source>Blood</source> <volume>110</volume>, <fpage>1806</fpage>&#x2013;<lpage>1813</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2007-02-075382</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Silverman</surname>
<given-names>B. W.</given-names>
</name>
</person-group> (<year>1986</year>). <source>Density estimation for statistics and data analysis</source>. <publisher-loc>London</publisher-loc>: <publisher-name>Chapman &#x26; Hall</publisher-name>.</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stiehl</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Marciniak-Czochra</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Characterization of stem cells using mathematical models of multistage cell lineages</article-title>. <source>Math. Comput. Model.</source> <volume>53</volume>, <fpage>1505</fpage>&#x2013;<lpage>1517</lpage>. <pub-id pub-id-type="doi">10.1016/j.mcm.2010.03.057</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ramos</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Chapman</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Johnnidis</surname>
<given-names>J. B.</given-names>
</name>
<name>
<surname>Le</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ho</surname>
<given-names>Y. J.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Clonal dynamics of native haematopoiesis</article-title>. <source>Nature</source> <volume>514</volume>, <fpage>322</fpage>&#x2013;<lpage>327</lpage>. <pub-id pub-id-type="doi">10.1038/nature13824</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Komarova</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Stochastic modeling of stem-cell dynamics with control</article-title>. <source>Math. Biosci.</source> <volume>240</volume>, <fpage>231</fpage>&#x2013;<lpage>240</lpage>. <pub-id pub-id-type="doi">10.1016/j.mbs.2012.08.004</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sz&#xe9;kely</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Burrage</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Mangel</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bonsall</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Stochastic dynamics of interacting haematopoietic stem cell niche lineages</article-title>. <source>PLoS Comput. Biol.</source> <volume>10</volume>, <fpage>e1003794</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1003794</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Verovskaya</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Broekhuis</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Zwart</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Ritsema</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>van Os</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>de Haan</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Heterogeneity of young and aged murine hematopoietic stem cells revealed by quantitative clonal analysis using cellular barcoding</article-title>. <source>Blood</source> <volume>122</volume>, <fpage>523</fpage>&#x2013;<lpage>532</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2013-01-481135</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Villani</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2009</year>). <source>Optimal transport, old and new</source>. <publisher-loc>Berlin Heidelberg</publisher-loc>: <publisher-name>Springer-Verlag</publisher-name>.</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Koelle</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Jares</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Clonal tracking of rhesus macaque hematopoiesis highlights a distinct lineage origin for natural killer cells</article-title>. <source>Cell. Stem Cell.</source> <volume>14</volume>, <fpage>486</fpage>&#x2013;<lpage>499</lpage>. <pub-id pub-id-type="doi">10.1016/j.stem.2014.01.020</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Guttorp</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Abkowitz</surname>
<given-names>J. L.</given-names>
</name>
</person-group> (<year>2018a</year>). <article-title>Visualizing hematopoiesis as a stochastic process</article-title>. <source>Blood Adv.</source> <volume>1</volume>, <fpage>2637</fpage>&#x2013;<lpage>2645</lpage>. <pub-id pub-id-type="doi">10.1182/bloodadvances.2018023705</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>B&#xf6;ttcher</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Chou</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Diversity in biology: Definitions, quantification and models</article-title>. <source>Phys. Biol.</source> <volume>17</volume>, <fpage>031001</fpage>. <pub-id pub-id-type="doi">10.1088/1478-3975/ab6754</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>I. S. Y.</given-names>
</name>
<name>
<surname>Chou</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2018b</year>). <article-title>Modeling large fluctuations of thousands of clones during hematopoiesis: The role of stem cell self-renewal and bursty progenitor dynamics in rhesus macaque</article-title>. <source>PLoS Comput. Biol.</source> <volume>14</volume>, <fpage>e1006489</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1006489</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yeh</surname>
<given-names>Y. H. J.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Razmi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ho</surname>
<given-names>Y. C.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>The clonal expansion dynamics of the HIV-1 reservoir: Mechanisms of integration site-dependent proliferation and HIV-1 persistence</article-title>. <source>Viruses</source> <volume>13</volume>, <fpage>1858</fpage>. <pub-id pub-id-type="doi">10.3390/v13091858</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yuan</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Research on K-value selection method of K-means clustering algorithm</article-title>. <source>J</source> <volume>2</volume>, <fpage>226</fpage>&#x2013;<lpage>235</lpage>. <pub-id pub-id-type="doi">10.3390/j2020016</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>