<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">762202</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2022.762202</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Genetic Diversity and Population Structure of Doum Palm (<italic>Hyphaene compressa</italic>) Using Genotyping by Sequencing</article-title>
<alt-title alt-title-type="left-running-head">Omire et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">Genetic Diversity of <italic>H. compressa</italic>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Omire</surname>
<given-names>Agnes</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1315889/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Neondo</surname>
<given-names>Johnstone</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1560360/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Budambula</surname>
<given-names>Nancy L. M.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1484339/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wangai</surname>
<given-names>Laura</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ogada</surname>
<given-names>Stephen</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Mweu</surname>
<given-names>Cecilia</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Botany</institution>, <institution>School of Biological Sciences</institution>, <institution>Jomo Kenyatta University of Agriculture and Technology</institution>, <addr-line>Nairobi</addr-line>, <country>Kenya</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Institute for Biotechnology Research (IBR)</institution>, <institution>Jomo Kenyatta University of Agriculture and Technology</institution>, <addr-line>Nairobi</addr-line>, <country>Kenya</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Biological Sciences</institution>, <institution>School of Pure and Applied Sciences</institution>, <institution>University of Embu</institution>, <addr-line>Embu</addr-line>, <country>Kenya</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Department of Biomedical Sciences</institution>, <institution>School of Health Sciences</institution>, <institution>Kirinyaga University</institution>, <addr-line>Kerugoya</addr-line>, <country>Kenya</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/99251/overview">Rana Dajani</ext-link>, Hashemite University, Jordan</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1062276/overview">Lizandra Jaqueline Robe</ext-link>, Federal University of Santa Maria, Brazil</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1521054/overview">Mukesh Choudhary</ext-link>, ICAR-Indian Institute of Maize Research, India</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1521687/overview">Amol N. Nankar</ext-link>, Center of Plant Systems Biology and Biotechnology, Bulgaria</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/419149/overview">Aleksandra Dimitrijevic</ext-link>, Institute of Field and Vegetable Crops, Serbia</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Cecilia Mweu, <email>cmweu@jkuat.ac.ke</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Evolutionary and Population Genetics, a section of the journal Frontiers in Genetics</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>04</day>
<month>02</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>13</volume>
<elocation-id>762202</elocation-id>
<history>
<date date-type="received">
<day>21</day>
<month>08</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>03</day>
<month>01</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Omire, Neondo, Budambula, Wangai, Ogada and Mweu.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Omire, Neondo, Budambula, Wangai, Ogada and Mweu</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<abstract>
<p>Doum palm (<italic>Hyphaene compressa</italic>) is a perennial economic plant primarily growing in Kenya&#x2019;s Arid and Semi-Arid Lands (ASALs). It is heavily relied upon for food, animal feed, construction materials and medicine, making it an ideal plant for resource sustainability. However, the limited information on its genetic resources has hindered its breeding and conservation studies. This study used the genotyping by sequencing approach to identify Single Nucleotide Polymorphisms. These SNPs were further used to assess the genetic diversity and population structure of 96&#x20;<italic>H. compressa</italic> accessions from Coastal, Northern and Eastern ASAL regions of Kenya using two approaches; reference-based and <italic>de novo</italic>-based assemblies. STRUCTURE analysis grouped the sampled accessions into two genetic clusters (Cluster 1 and Cluster 2). Cluster 1 included accessions from the Northern region, whereas Cluster 2 included all accessions from Eastern and Coastal regions. Accessions from Kwale (Coastal) had mixed ancestry from both Cluster 1 and Cluster 2. These STRUCTURE findings were further supported by principal components analysis, discriminant analysis of principal components and phylogenetic analysis. Analysis of molecular variance indicated greater genetic variation within populations (92.7%) than among populations (7.3%). An overall F<sub>ST</sub> of 0.074 was observed, signifying moderate genetic differentiation among populations. The results of this study will provide information useful in breeding, marker-assisted selection and conservation management of <italic>H. compressa.</italic>
</p>
</abstract>
<kwd-group>
<kwd>genetic diversity</kwd>
<kwd>GBS</kwd>
<kwd>single nucleotide polymorphisms</kwd>
<kwd>population structure</kwd>
<kwd>
<italic>Hyphaene compressa</italic>
</kwd>
<kwd>doum palm</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>
<italic>Hyphaene compressa</italic> H. Wendl., also known as the East African doum palm, is a member of the Arecaceae family. It is integral in the agroforestry system of coastal and riverine parts of Africa (<xref ref-type="bibr" rid="B1">Amwatta, 2004</xref>; <xref ref-type="bibr" rid="B36">Uhl and Moore, 2019</xref>). The doum palm also grows in the arid and semi-arid lands (ASALs) of Kenya (<xref ref-type="bibr" rid="B34">Maundu and Tengnas, 2005</xref>). It is a valuable source of food, animal feed, medicine for headaches and worms, as well as non-wood products for construction and weaving. Thus, it is a substantial income-generating plant, particularly for women in ASALs who derive their livelihoods from the sale of woven leaf products (<xref ref-type="bibr" rid="B1">Amwatta, 2004</xref>; <xref ref-type="bibr" rid="B34">Maundu and Tengnas, 2005</xref>; <xref ref-type="bibr" rid="B40">Omire et&#x20;al., 2020a</xref>). The ability to withstand waterlogging, drought and salinity makes the doum palm a reliable economic plant with ability to avert natural calamities including drought in such areas (<xref ref-type="bibr" rid="B1">Amwatta, 2004</xref>; <xref ref-type="bibr" rid="B40">Omire et&#x20;al., 2020a</xref>).</p>
<p>In Kenyan ASALs, non-timber products are restricted to a few plant species such as <italic>H. compressa</italic>, subsequently threatening its existence. Thus, <italic>H. compressa</italic> is classified as a threatened and a national priority species in the ASALs of Kenya with a high potential for genetic erosion due to overexploitation by the rural communities (<xref ref-type="bibr" rid="B29">Kigomo, 2001</xref>). However, the International Union for Conservation of Nature (IUCN) considers it a species of least concern with an unknown population trend due to its wide geographical distribution throughout East Africa (<xref ref-type="bibr" rid="B8">Cosiaux et&#x20;al., 2017</xref>). Whereas species might exist as large populations they could be regionally threatened. <italic>Hyphaene. compressa</italic> resources are known to be strained and overexploited in the Eastern part of Kenya (<xref ref-type="bibr" rid="B40">Omire et&#x20;al., 2020a</xref>). Despite this knowledge on the status, there are no known interventions to reverse the current trend (<xref ref-type="bibr" rid="B29">Kigomo, 2001</xref>). This could exacerbate the risk of extinction of such species (<xref ref-type="bibr" rid="B9">Cosiaux et&#x20;al., 2018</xref>).</p>
<p>Threats to <italic>H. compressa</italic> include human interference as well as biotic and abiotic stress (<xref ref-type="bibr" rid="B40">Omire et&#x20;al., 2020a</xref>). Overgrazing by pastoralist communities, particularly along the riverine areas, is a significant threat to this palm since livestock graze and browse on <italic>H. compressa</italic> (<xref ref-type="bibr" rid="B29">Kigomo, 2001</xref>). The strain on <italic>H. compressa</italic> resources has been aggravated by the sedentarization of the nomadic pastoralists (<xref ref-type="bibr" rid="B1">Amwatta, 2004</xref>). Sedentarization leads to the assemblage of pastoralists around limited resources and ultimately to land degradation (<xref ref-type="bibr" rid="B25">Johnson, 1993</xref>). Another source of pressure on <italic>H. compressa</italic> is overharvesting and harvesting of immature sword leaves. These leaf pressures have been shown to cause dwarfing in a sister palm, <italic>Hyphaene thebaica</italic> (<xref ref-type="bibr" rid="B27">Kahn and Luxereau, 2008</xref>). Other selection pressures on <italic>H. compressa</italic> include logging, burning and wine tapping from the apical meristem. These pressures collectively lead to genetic drift through the loss of specific genotypes, which might eventually affect the <italic>H. compressa</italic> gene pool (<xref ref-type="bibr" rid="B29">Kigomo, 2001</xref>).</p>
<p>There is scanty information on the genetic diversity of doum palm which limits access to its important traits and thus hinders its improvement. Previous diversity studies on <italic>H. compressa</italic> focussed on accessing the variability of its morphological traits (<xref ref-type="bibr" rid="B41">Omire et&#x20;al., 2020b</xref>). The study identified five morphotypes with accessions from the Kenyan Coastal area being the most heterogeneous. However, this cannot be used to adequately delineate the doum palm since morphological markers may also be affected by the environment, are limited in number, unstable, slow and some appear late in plant development making them difficult to score (<xref ref-type="bibr" rid="B2">Andersen and Lubberstedt, 2003</xref>; <xref ref-type="bibr" rid="B35">Mokhtar et&#x20;al., 2016</xref>). Furthermore, using a single marker like morphology is not adequate to assess diversity (<xref ref-type="bibr" rid="B28">Khan et&#x20;al., 2012</xref>). Overall, genetic markers are superior to morphological markers (<xref ref-type="bibr" rid="B20">Ganie et&#x20;al., 2015</xref>) and may or may not agree with phenotypic expression of a genomic&#x20;trait.</p>
<p>For non-model plants like doum palm with no reference genome, sequencing the whole genome to mine the SNPs would be ideal. There are other methods like Genotyping by Sequencing (GBS) that are able to acquire in depth data on parts of the genome and are as effective but less costly compared to whole genome sequencing (<xref ref-type="bibr" rid="B50">Wallace and Mitchell, 2017</xref>). GBS is a method that provides reduced libraries for Illumina next generation sequencing (NGS) by targeting the subsets with restriction enzymes followed by ligation of DNA barcoded adapters (<xref ref-type="bibr" rid="B15">Elshire et&#x20;al., 2011</xref>). PCR amplification and high throughput NGS of the genomic subsets on a single lane of flow cells is then done (<xref ref-type="bibr" rid="B15">Elshire et&#x20;al., 2011</xref>; <xref ref-type="bibr" rid="B22">He et&#x20;al., 2014</xref>; <xref ref-type="bibr" rid="B6">Burghardt, et&#x20;al., 2017</xref>). GBS is simple, rapid and highly reproducible (<xref ref-type="bibr" rid="B11">Davey et&#x20;al., 2011</xref>; <xref ref-type="bibr" rid="B6">Burghardt et&#x20;al., 2017</xref>). These features make GBS highly attractive for several genetic applications, including genetic diversity, phylogeny, genome-wide association studies, association maps, genomic selection, physical and linkage maps (<xref ref-type="bibr" rid="B6">Burghardt et&#x20;al., 2017</xref>). GBS is an ideal tool for genetic diversity studies with the advantage of being able to identify SNPs, insertions, deletions and microsatellites (<xref ref-type="bibr" rid="B15">Elshire et&#x20;al., 2011</xref>) even in non-model organisms with no prior genome information (<xref ref-type="bibr" rid="B48">Taranto et&#x20;al., 2016</xref>). Diversity studies can be combined with phylogenetic studies to provide more information on the origin and domestication of the germplasm for conservation purposes (<xref ref-type="bibr" rid="B6">Burghardt et&#x20;al., 2017</xref>). Earlier studies have alluded to the fact that the evolution of a population is guided by its local interactions in the environment (<xref ref-type="bibr" rid="B31">Klimova et&#x20;al., 2018</xref>). Gene flow has a tendency to homogenize populations and reduce genetic variability (<xref ref-type="bibr" rid="B5">Brunet et&#x20;al., 2012</xref>). However, there needs to be enough gene pool on which selection can take place for effective speciation.</p>
<p>Thus far, the genetic diversity of <italic>H. compressa</italic> remains unknown despite its economic and subsistence role in Africa&#x2019;s ASALs. There were no <italic>H. compressa</italic> or other palms in the genus <italic>Hyphaene</italic> with assembled genomes at the time of this study. Due to the scanty genetic information coupled with the pressure already demonstrated on this palm, there is a need to decipher its genetics. This study assumes that the different accessions of <italic>H. compressa</italic> growing in Kenya are diverse. The present study aimed to identify genome-wide SNPs, assess the level of genetic diversity, determine the population structure and estimate gene flow between <italic>H. compressa</italic> accessions collected from four ASAL regions of Kenya using GBS approach. The data obtained from this study will be an important genomic resource that will be used to inform the conservation, management, breeding and propagation of <italic>H. compressa</italic>.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>Materials and Methods</title>
<sec id="s2-1">
<title>
<italic>H. compressa</italic> Plant Materials</title>
<p>A total of 96&#x20;<italic>H. compressa</italic> accessions collected between February and August of 2018 were used in this study. These accessions were collected from different ASALs of Kenya; Eastern (Tharaka Nithi County), Northern (Turkana County), Coastal (Kwale and Tana River counties) as shown in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref> and <xref ref-type="sec" rid="s11">Supplementary Table S1</xref>. Leaf samples of the selected plants were collected using sterile blades and placed in sterile tubes containing 10&#xa0;g of silica gel for DNA extraction. Accessions within approximately the same age group and located as distantly as possible from each other were sampled.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Map illustrating <italic>H. compressa</italic> sampling points along the Turkana and Tana basins. Map was created using ArcMap version 10.8.</p>
</caption>
<graphic xlink:href="fgene-13-762202-g001.tif"/>
</fig>
</sec>
<sec id="s2-2">
<title>Preparation of Libraries and Sequencing</title>
<p>Genomic DNA was isolated from <italic>H. compressa</italic> leaves using DNeasy<sup>&#xae;</sup> Plant Mini Kit (Qiagen, Germany). The purity and quantity of the DNA were determined using Qubit Fluorometer (Invitrogen) or microplate reader (DR-200B, Diatek), while a 1% agarose gel was used to confirm its integrity. Commercial GBS sequencing was done at Beijing Genomics Institute (BGI, China). A total of 96 samples; Tharaka (27), Turkana (21), Tana River (20) and Kwale (28), passed the sample quality check (QC) and proceeded to library preparation.</p>
<p>Library preparation was done following the method previously described by <xref ref-type="bibr" rid="B15">Elshire et&#x20;al. (2011)</xref>. Essentially, the DNA samples were barcoded and adapter pairs plated. The restriction enzyme ApeK1 (GCWGC as the recognition site) was used, followed by adapter ligation to the DNA fragments. This was followed by pooling and purification. PCR was then performed using primers with adapter binding sites. Sample clean-up of the PCR products, fragment size selection and sequencing on a Hiseq X10 platform as paired-end 100&#xa0;bp (Illumina PE 100) was done. Adapter sequences, sequences with low-quality reads, and those lacking barcodes were discarded from the raw&#x20;reads.</p>
<p>The data was processed using the <italic>de_novo</italic> and reference-based approaches. In the <italic>de_novo</italic> assembly, ipyrad version 0.9.74 (<xref ref-type="bibr" rid="B13">Eaton and Overcast, 2020</xref>) was used to assemble sequences without a reference genome using the following parameters; assembly method <italic>de_novo</italic>, datatype pairgbs, mindepth_statistical 6, mindepth_majrule 6, min_samples_locus 4 and other parameters set to default. In the reference-based approach, paired read ends were mapped to the <italic>Phoenix dactylifera</italic> (date palm) genome (<xref ref-type="bibr" rid="B21">Hazzouri et&#x20;al., 2019</xref>). A confamilial (same family) reference genome was used for SNP calling (<xref ref-type="bibr" rid="B19">Galla et&#x20;al., 2019</xref>) since <italic>H. compressa</italic> had no assembled genome at the time of this study. These two palms belong to the same subfamily Coryphoideae. <italic>Phoenix dactylifera</italic> genome was the only available genome in this subfamily. Alignment of the sequence reads against the date palm reference genome was done using the Burrows-Wheeler Aligner (BWA) using the parameters &#x2018;mem&#x2013;t4 &#x2013;k32 &#x2013;M&#x2019; (<xref ref-type="bibr" rid="B32">Li and Durbin, 2009</xref>). SNP filtering was done using VCFtools version 0.1.16 (<xref ref-type="bibr" rid="B10">Danecek et&#x20;al., 2011</xref>) with the following parameters; biallelic SNPs, min meanDp 2, removing indels, Minor Allele Frequency (MAF) 0.05, minDP 2, max-missing&#x20;0.8.</p>
</sec>
<sec id="s2-3">
<title>Data Analysis</title>
<p>The quality of the filtered VCF files were assessed using the R package tidyverse (<xref ref-type="bibr" rid="B51">Wickham et&#x20;al., 2019</xref>). The read depth per site, heterozygosity, read depth per individual and read quality were determined.</p>
</sec>
<sec id="s2-4">
<title>Population Structure Analysis and Genetic Diversity</title>
<p>Population structure was determined by STRUCTURE software version 2.3.4 using the admixture model (<xref ref-type="bibr" rid="B45">Pritchard et&#x20;al., 2000</xref>). Populations of <italic>K</italic> (<italic>K</italic>&#x20;&#x3d; 1&#x2013;10) were run with three replications using a burn-in of 100, 000 generations and 100, 000 Markov Chain Monte Carlo (MCMC) iterations. The software STRUCTURE HARVESTER web Version 0.6.94 (<xref ref-type="bibr" rid="B12">Earl and VonHoldt, 2012</xref>) available at <ext-link ext-link-type="uri" xlink:href="http://taylor0.biology.ucla.edu/structureHarvester/">http://taylor0.biology.ucla.edu/structureHarvester/</ext-link> was used to determine the optimal K value using the <italic>adhoc delta K</italic> (<xref ref-type="bibr" rid="B16">Evanno et&#x20;al., 2005</xref>). To plot the structure results, the POPHELPER version 2.3.1 package in R was used (<xref ref-type="bibr" rid="B18">Francis, 2017</xref>). Genotypes that had &#x2265;0.80 membership proportion and those with less than this value were assigned to pure and admixture populations, respectively (<xref ref-type="bibr" rid="B39">Nkhoma et&#x20;al., 2020</xref>).</p>
<p>Discriminant Analysis of Principal Components (DAPC) was also used to evaluate the population structure of <italic>H. compressa</italic> using the package adegenet version 2.1.3 (<xref ref-type="bibr" rid="B26">Jombart, 2008</xref>) in R. To visualize each sample&#x2019;s assignment, a composite stacked bar plot illustrating the probability of population membership on the <italic>Y</italic>-axis was generated. Principal component analysis (PCA) was constructed using the R software package SNPrelate (<xref ref-type="bibr" rid="B53">Zheng et&#x20;al., 2012</xref>) to determine the genetic relationships of <italic>H. compressa</italic> accessions.</p>
<p>Observed heterozygosity (<italic>H</italic>
<sub>
<italic>o</italic>
</sub>), Expected heterozygosity (<italic>H</italic>
<sub>
<italic>e</italic>
</sub>) fixation index (<italic>F</italic>
<sub>
<italic>ST</italic>
</sub>), inbreeding coefficient (<italic>F</italic>
<sub>
<italic>IS</italic>
</sub>), Analysis of Molecular Variance (AMOVA) and pairwise <italic>F</italic>
<sub>
<italic>ST</italic>
</sub> values of the population were determined using Arlequin version 3.5.2.2 (<xref ref-type="bibr" rid="B17">Excoffier and Lischer, 2010</xref>).</p>
</sec>
<sec id="s2-5">
<title>Phylogenetic Analysis</title>
<p>To construct a splitstree, the filtered VCF file was converted to a nexus file using vcf2phylip.py script (<xref ref-type="bibr" rid="B42">Ortiz, 2019</xref>). The nexus file was then used to generate an unrooted splitstree using the neighbor net method in SplitsTree software, version 4.17.0 (<xref ref-type="bibr" rid="B23">Huson and Bryant, 2006</xref>). An UPGMA distance tree was also constructed using R software to represent the genetic clustering of <italic>H. compressa</italic> accessions.</p>
</sec>
<sec id="s2-6">
<title>Migration Rates Between the Eastern and Coastal Populations Along the Tana Basin</title>
<p>To determine if the population structure observed along the Tana basin is influenced by seed dispersal along the river, gene flow was estimated using MIGRATE-n software version 3.6.11. A Bayesian inference strategy was used with constant mutation rates among all loci. Burn in was set at 5,000 iterations at each locus. Static heating at four different temperatures (1, 1.5, 3 and 6) was used to improve the MCMC searches. One gene flow model was designed with direct migration from Tharaka to Tana River and to Kwale. The drainage of the Tana basin was used to design this model. Turkana accessions were excluded from this model since structure analysis and PCA demonstrated little historical gene flow. To judge whether the runs converged on good answers, the histograms and the effective population sizes were checked.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<p>Paired-end sequencing of 96&#x20;<italic>H. compressa</italic> accessions yielded an average of 2.4 million reads per sample. The <italic>de_novo</italic>-based assembly using ipyrad software resulted in 3,941 raw loci. After filtering, a total of 2,096 SNPs with a mean depth of 35.7 (minimum 10.47, maximum 217.45) were retained using the <italic>de_novo</italic> based assembly. On the other hand, reference-based assembly using date palm as a reference genome resulted in 3.4 million loci. After filtering, 23,146 biallelic SNPs with a mean depth of 3.5 (minimum 2, maximum 47.49) were obtained using the reference-based assembly.</p>
<p>The SNPs obtained from <italic>de_novo</italic> based assembly had higher depths than the reference-based assembly, as shown by the individual sequencing depth and the mean depth. The proportion of missing data per accession was low for both the <italic>de_novo</italic> based and reference-based assemblies, with a maximum of 0.04 and 0.4, respectively. These VCF quality statistics, including the mean depth, observed heterozygosity, depth per individual and missing data per individual, are presented for both the <italic>de_novo</italic> based assembly (<xref ref-type="sec" rid="s11">Supplementary Figure S1</xref>) and reference-based assembly (<xref ref-type="sec" rid="s11">Supplementary Figure&#x20;S2</xref>).</p>
<p>In the <italic>de_novo</italic> based assembly there were 1,283 (61.2%) transition SNPs and 813 (38.8%) transversion SNPs with the following types: A&#x2194;G type (651, 31.1%), C&#x2194;T type (632, 30.2%), A&#x2194;C type (192, 9.2%), A&#x2194;T type (174, 8.3%), C&#x2194;G type (222, 10.6%), G&#x2194;T type (225, 10.7%). There were 16,598 (70.9%) transition SNPs and 6,818 (29.1%) transversion SNPs with the following types: A&#x2194;G type (8,332, 35.6%), C&#x2194;T type (8,266, 35.3%), A&#x2194;C type (1,684, 7.2%), A&#x2194;T type (1825, 7.8%), C&#x2194;G type (1,636, 7%), and G&#x2194;T type (1,673, 7.1%) in the reference based assembly. The A&#x2194;G and C&#x2194;T transition SNPs had the highest counts for both assemblies (<xref ref-type="sec" rid="s11">Supplementary Table S2</xref>). The transition SNPs versus transversion SNPs (Ts/Tv) ratio was 1.6 in the <italic>de_novo</italic> based assembly and 2.4 in the reference based assembly.</p>
<sec id="s3-1">
<title>Population Structure and Genetic Diversity</title>
<p>The optimal delta <italic>K</italic> was detected at <italic>K</italic>&#x20;&#x3d; 2 for both the <italic>de_novo</italic>-based assembly (<xref ref-type="sec" rid="s11">Supplementary Figure S3A</xref>) and reference-based assembly (<xref ref-type="sec" rid="s11">Supplementary Figure S3B</xref>), which inferred two genetic clusters of <italic>H</italic>. <italic>compressa</italic> (<xref ref-type="fig" rid="F2">Figure&#x20;2</xref>). Cluster 1 consisted of accessions from Turkana while cluster 2 consisted of accessions from Tharaka, Kwale and Tana River for both reference-based and <italic>de_novo</italic>-based assemblies. The accessions in Cluster 2 were sampled along the Tana basin and Kwale county as shown in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>. The expected heterozygosity was lower for the <italic>de_novo</italic>-based assembly for cluster 1 (<italic>H</italic>
<sub>
<italic>e</italic>
</sub> &#x3d; 0.14) than cluster 2 (<italic>H</italic>
<sub>
<italic>e</italic>
</sub> &#x3d; 0.23). However, similar expected heterozygosity values were observed in the reference-based assembly for the two clusters (<italic>H</italic>
<sub>
<italic>e</italic>
</sub> &#x3d; 0.30). The genetic variation among populations in Cluster 1 was higher (<italic>de_novo F</italic>
<sub>
<italic>ST</italic>
</sub> &#x3d; 0.68 and reference-based <italic>F</italic>
<sub>
<italic>ST</italic>
</sub> &#x3d; 0.17) than Cluster 2 (<italic>de_novo F</italic>
<sub>
<italic>ST</italic>
</sub> &#x3d; 0.3 and Reference-based <italic>F</italic>
<sub>
<italic>ST</italic>
</sub> &#x3d; 0.06). A total of seven accessions from Kwale had admixed ancestry between Cluster 1 and Cluster 2 using the reference based assembly (<xref ref-type="table" rid="T1">Table&#x20;1</xref>). There were no accessions in the <italic>de_novo</italic> assembly that had admixed ancestry values less than 88%. Structure results indicate that two gene pools best describe the population structure of <italic>H. compressa</italic>. However, a smaller peak observed at <italic>K</italic>&#x20;&#x3d; 3 might be another informative <italic>H. compressa</italic> population clustering (<xref ref-type="sec" rid="s11">Supplementary Figures S3, S4</xref>). Similar grouping of accessions using PCA for the <italic>de_novo</italic> and reference-based assemblies was observed in this study (<xref ref-type="fig" rid="F3">Figure&#x20;3</xref>). In both PCA plots, Tharaka Nithi, Kwale and Tana River accessions were closely clustered. PCA results were congruent with structure results.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>STRUCTURE bar plot of admixture model population assignment of 96&#x20;<italic>Hyphaene compressa</italic> accessions from Kenya based on 2,096 SNPs for the <italic>de_novo</italic> assembly <bold>(A)</bold> and 23,416 SNPs based on reference assembly <bold>(B)</bold>. The accessions are divided into two clusters. A combination of different colors represents admixed populations.</p>
</caption>
<graphic xlink:href="fgene-13-762202-g002.tif"/>
</fig>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>STRUCTURE analysis of <italic>Hyphaene compressa</italic> from Kenya using reference-based and <italic>de_novo</italic> based assembly.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Assembly method</th>
<th align="center">Tharaka</th>
<th align="center">Tana river</th>
<th align="center">Kwale</th>
<th align="center">Turkana</th>
<th align="center">
<italic>He</italic>
</th>
<th align="center">
<italic>F</italic>
<sub>
<italic>ST</italic>
</sub>
</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">
<bold>Reference assembly</bold>
</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td align="left">&#xa0;&#xa0;Cluster 1</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="char" char=".">21</td>
<td align="char" char=".">0.29</td>
<td align="char" char=".">0.17</td>
</tr>
<tr>
<td align="left">&#xa0;&#xa0;Cluster 2</td>
<td align="char" char=".">27</td>
<td align="char" char=".">20</td>
<td align="char" char=".">21</td>
<td align="center">&#x2014;</td>
<td align="char" char=".">0.30</td>
<td align="char" char=".">0.06</td>
</tr>
<tr>
<td align="left">&#xa0;&#xa0;Admixed</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="char" char=".">7</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td colspan="7" align="left">
<bold>
<italic>De_novo</italic> assembly</bold>
</td>
</tr>
<tr>
<td align="left">&#xa0;&#xa0;Cluster 1</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="char" char=".">21</td>
<td align="char" char=".">0.14</td>
<td align="char" char=".">0.68</td>
</tr>
<tr>
<td align="left">&#xa0;&#xa0;Cluster 2</td>
<td align="char" char=".">27</td>
<td align="char" char=".">20</td>
<td align="char" char=".">28</td>
<td align="center">&#x2014;</td>
<td align="char" char=".">0.23</td>
<td align="char" char=".">0.30</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Principal Component Analysis (PCA) of <italic>Hyphaene compressa</italic> Kenyan accessions using 2096 SNPs obtained from the <italic>de novo</italic> assembly <bold>(A)</bold> and 23,416 SNPs obtained from the date palm reference based assembly <bold>(B)</bold>.</p>
</caption>
<graphic xlink:href="fgene-13-762202-g003.tif"/>
</fig>
<p>DAPC analysis grouped <italic>H. compressa</italic> accessions into two clusters, with samples from Turkana falling to the right side of the DAPC vertical axis while the rest fell on the left side. There was moderate overlap between Kwale and Tana River accessions, while Tharaka accessions were distinctly separate (<xref ref-type="fig" rid="F4">Figure&#x20;4</xref>). DAPC analysis, composite plot and genetic diversity results are shown for only the reference based assembly SNP data since both assembly methods had shown congruent results in structure and PCA analysis. Population membership assignment using DAPC composite plot confirmed structure and PCA results. All the accessions along the Tana basin exhibited admixture with profoundly shared ancestry between Tharaka and Tana River. Kwale had the highest level of admixture (<xref ref-type="fig" rid="F5">Figure&#x20;5</xref>). DAPC results also confirmed no admixture between Turkana and accessions from the other regions.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Discriminant analysis of principal components (DAPC) of 96&#x20;<italic>Hyphaene compressa</italic> Kenyan accessions using 23,416 SNPs derived from GBS analysis using reference-based assembly. Inertia ellipses represent clusters in different colors. Each dot on the circle represents an accession.</p>
</caption>
<graphic xlink:href="fgene-13-762202-g004.tif"/>
</fig>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Composite plot of <italic>Hyphaene compressa</italic> Kenyan accessions using reference-based assembly showing mixed ancestry between Kwale, Tana River and Tharaka. Each accession is a stacked bar chart with populations shown in colors.</p>
</caption>
<graphic xlink:href="fgene-13-762202-g005.tif"/>
</fig>
<p>The four sampled regions of Tharaka, Tana River, Kwale and Turkana were assessed for the number of polymorphic sites, expected heterozygosity (<italic>H</italic>
<sub>
<italic>e</italic>
</sub>) or gene diversity, observed heterozygosity (<italic>H</italic>
<sub>
<italic>o)</italic>
</sub>, <italic>F</italic>
<sub>
<italic>IS</italic>
</sub> and <italic>F</italic>
<sub>
<italic>ST</italic>
</sub>
<italic>.</italic> The genetic variation among the <italic>H. compressa</italic> populations was moderate (<italic>F</italic>
<sub>
<italic>ST</italic>
</sub> &#x3d; 0.074, <italic>p</italic>&#x20;&#x2264; 0.001). The observed heterozygosity was higher than the expected heterozygosity in all the populations (<xref ref-type="table" rid="T2">Table&#x20;2</xref>). Negative <italic>F</italic>
<sub>
<italic>IS</italic>
</sub> values were obtained in all the populations, with Turkana having the lowest <italic>F</italic>
<sub>
<italic>IS</italic>
</sub> value (&#x2212;0.45). Kwale had the highest polymorphic sites (11,932) followed by Turkana (10,698) as shown in <xref ref-type="table" rid="T2">Table&#x20;2</xref>. Tana River had the lowest diversity (<italic>H</italic>
<sub>
<italic>e</italic>
</sub> &#x3d; 0.23, Polymorphic sites &#x3d; 8,370) of all the sampled regions (<xref ref-type="table" rid="T2">Table&#x20;2</xref>).</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Mean values of genetic diversity indices determined for <italic>Hyphaene compressa</italic> accessions in the sampled populations.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left">Genetic index</th>
<th colspan="4" align="center">Region</th>
<th rowspan="2" align="center">Overall</th>
</tr>
<tr>
<th align="center">Tharaka</th>
<th align="center">Turkana</th>
<th align="center">Tana river</th>
<th align="center">Kwale</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Number of polymorphic sites</td>
<td align="char" char=".">9,277</td>
<td align="char" char=".">10,698</td>
<td align="char" char=".">8,370</td>
<td align="char" char=".">11,932</td>
<td align="char" char=".">23,416</td>
</tr>
<tr>
<td align="left">Observed heterozygosity (<italic>H</italic>
<sub>
<italic>o</italic>
</sub>)</td>
<td align="char" char=".">0.45</td>
<td align="char" char=".">0.47</td>
<td align="char" char=".">0.46</td>
<td align="char" char=".">0.44</td>
<td align="char" char=".">0.404</td>
</tr>
<tr>
<td align="left">Expected heterozygosity (<italic>H</italic>
<sub>
<italic>e</italic>
</sub>)</td>
<td align="char" char=".">0.32</td>
<td align="char" char=".">0.33</td>
<td align="char" char=".">0.23</td>
<td align="char" char=".">0.33</td>
<td align="char" char=".">0.31</td>
</tr>
<tr>
<td align="left">
<italic>F</italic>
<sub>
<italic>IS</italic>
</sub>
</td>
<td align="char" char=".">&#x2212;0.40</td>
<td align="char" char=".">&#x2212;0.45</td>
<td align="char" char=".">&#x2212;0.42</td>
<td align="char" char=".">&#x2212;0.37</td>
<td align="char" char=".">&#x2212;0.040</td>
</tr>
<tr>
<td align="left">
<italic>F</italic>
<sub>
<italic>ST</italic>
</sub>
</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="char" char=".">0.074</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Pairwise <italic>F</italic>
<sub>
<italic>ST</italic>
</sub> values ranged between 0.025 (Tharaka and Tana River) and 0.105 (Turkana and Tana River). High pairwise <italic>F</italic>
<sub>
<italic>ST</italic>
</sub> was recorded among Turkana and Tana River samples (<xref ref-type="table" rid="T3">Table&#x20;3</xref>). The lowest pairwise <italic>F</italic>
<sub>
<italic>ST</italic>
</sub> was between Tharaka and Tana River, suggesting gene flow between the two regions. AMOVA showed that populations from each of the four regions of Turkana, Tharaka, Tana River and Kwale were slightly different from each other (<italic>p</italic>&#x20;&#x2264; 0.001, <xref ref-type="table" rid="T4">Table&#x20;4</xref>). The variation within populations was higher (92.7%) than among populations (7.3%).</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Pairwise <italic>F</italic>
<sub>
<italic>ST</italic>
</sub> values of Kenyan populations of <italic>Hyphaene compressa</italic>.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Population</th>
<th align="center">Turkana</th>
<th align="center">Kwale</th>
<th align="center">Tharaka</th>
<th align="center">Tana river</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td colspan="5" align="left">Turkana</td>
</tr>
<tr>
<td align="left">Kwale</td>
<td align="char" char=".">0.07952</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Tharaka</td>
<td align="char" char=".">0.09795</td>
<td align="char" char=".">0.03629</td>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Tana River</td>
<td align="char" char=".">0.10541</td>
<td align="char" char=".">0.03329</td>
<td align="char" char=".">0.02505</td>
<td align="char" char=".">0.00</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Analysis of molecular variance (AMOVA) in genetic variation of <italic>Hyphaene compressa</italic> among and within populations of Kwale, Tharaka, Turkana and Tana River counties in Kenya.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Source of variation</th>
<th align="center">Sum&#x20;of squares</th>
<th align="center">Variance components</th>
<th align="center">Percentage variation</th>
<th align="center">
<italic>p</italic>-value</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Among populations</td>
<td align="char" char=".">42728.129</td>
<td align="char" char=".">266.91865</td>
<td align="char" char=".">7.32597</td>
<td align="char" char=".">0.00</td>
</tr>
<tr>
<td align="left">Within populations</td>
<td align="char" char=".">558905.557</td>
<td align="char" char=".">3376.54026</td>
<td align="char" char=".">92.67403</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Total</td>
<td align="char" char=".">
<bold>601633.686</bold>
</td>
<td align="char" char=".">
<bold>3643.45891</bold>
</td>
<td align="char" char=".">
<bold>100</bold>
</td>
<td align="left"/>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-2">
<title>Phylogenetic Analysis</title>
<p>The neighbor net network was able to group <italic>H. compressa</italic> accessions by region. Tana River, Kwale and Tharaka samples clustered closely compared to the Turkana, which was separated from the rest (<xref ref-type="fig" rid="F6">Figure&#x20;6</xref>). Samples from Turkana clustered together. Some of the Kwale accessions clustered closely with Tana River while other Kwale accessions clustered more closely with Tharaka accessions. The UPGMA phylogenetic tree showed two main clusters with Turkana accessions clustering in one cluster and the rest of the accessions in the other cluster. Kwale populations also revealed reciprocal monophyly (<xref ref-type="sec" rid="s11">Supplementary Figure&#x20;S5</xref>).</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>NeighbourNet network generated using 23,416 SNPs derived from reference-based GBS analysis of Kenyan <italic>Hyphaene compressa</italic> using SplitsTree version 4.17.0.</p>
</caption>
<graphic xlink:href="fgene-13-762202-g006.tif"/>
</fig>
</sec>
<sec id="s3-3">
<title>Migration Rates Among <italic>H. compressa</italic> Accessions Along the Tana Basin</title>
<p>The highest gene flow was observed from Tharaka and Tana River samples (<italic>m</italic>&#x20;&#x3d; 139.1), followed by Kwale to Tharaka (102.7), Tana River to Kwale (63.1), Tana River to Tharaka (59.9), Tharaka to Kwale (50.3) and Kwale to Tana River (57.7). These results indicate that the gene flow along the Tana basin was mostly asymmetrical (<xref ref-type="sec" rid="s11">Supplementary Figure&#x20;S6</xref>).</p>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>This study is the first to report the use of SNPs through the GBS approach to characterize <italic>H. compressa</italic> accessions in Kenya<italic>.</italic> SNP markers are very stable, frequent and specific to regions of the genome which makes them ideal for use in marker assisted selection (MAS) and diversity studies to aid future germplasm conservation.</p>
<p>Two comparative methods (reference-based and <italic>de_novo</italic>-based approaches) were used to infer the population structure and genetic diversity of <italic>H</italic>. <italic>compressa</italic>. In the reference-based assembly, <italic>Phoenix dactylifera</italic> was used as a reference genome. This confamilial genome was used because <italic>H. compressa</italic> had no assembled genome at the time of this study. In the absence of a reference genome of the same species (conspecific) or genus (congeneric), a confamilial reference genome can be used to provide similar estimates of diversity (<xref ref-type="bibr" rid="B4">Brandies et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B19">Galla et&#x20;al., 2019</xref>). <xref ref-type="bibr" rid="B19">Galla et&#x20;al. (2019)</xref> further recommends using a confamilial reference genome as the most distant genome ideal for diversity studies. There were differences in the two methods concerning abundance, quality scores and the TS/TV ratios of the SNPs obtained. For example, the highest number of SNPs was observed from the reference-based assembly (23,416) compared to the <italic>de_novo</italic>-based assembly (2096). The reference-based assembly has also been previously demonstrated to outperform <italic>de_novo</italic> assembly in determining the number of SNPs in olive cultivars (<xref ref-type="bibr" rid="B54">D&#x2019;Agostino et&#x20;al., 2018</xref>). Elsewhere, it has been reported that parameters set during assembly and the type of assembly influence the number and depth of SNPs obtained (<xref ref-type="bibr" rid="B55">Bohling, 2020</xref>). Besides, more stringent parameters are normally used for <italic>de_novo</italic> assemblies. GBS of <italic>H. compressa</italic> accessions showed considerable SNP variations with transition SNPs (purine-purine or pyrimidine-pyrimidine) being the most frequent mutations. This high frequency in transition SNPs has also been observed in many plants such as <italic>Capsicum annuum</italic>, <italic>Vigna unguiculata</italic>, <italic>Elaeis guineensis</italic>, and <italic>Camelia sativa</italic> (<xref ref-type="bibr" rid="B44">Pootakham et&#x20;al., 2015</xref>; <xref ref-type="bibr" rid="B48">Taranto et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B52">Xiong et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B33">Luo et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B24">Hyun et&#x20;al., 2020</xref>), of which the C-T transitions are the most frequent (<xref ref-type="bibr" rid="B14">Edwards et&#x20;al., 2007</xref>). However, low TS/TV ratio was observed in <italic>de_novo</italic> based assembly. This phenomenon has also been observed elsewhere and was attributed to the differences in the SNP calling methods (<xref ref-type="bibr" rid="B46">Shafer et&#x20;al., 2017</xref>). Despite the difference between the two methods, structure analysis and PCA produced congruent results. A similar study that used a <italic>de_novo</italic> approach, a confamilial reference and a congeneric reference to determine the phylogenetic relationship of the <italic>Amaranthus</italic> genus, produced differing SNP counts but similar phylogenetic trees (<xref ref-type="bibr" rid="B56">Stetter and Schmid, 2017</xref>). Other studies have also reported differing SNP abundance between reference-based and <italic>de_novo</italic> assemblies but consistent population clustering (<xref ref-type="bibr" rid="B54">D&#x2019;Agostino et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B46">Shafer et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B56">Stetter and Schmid, 2017</xref>).</p>
<p>STRUCTURE analysis grouped the <italic>H. compressa</italic> accessions into two gene pools. PCA and DAPC were consistent with these structure results. Accessions from Turkana (Northern Kenya) were pooled into cluster 1. Cluster 2 had the highest number of genotypes that included accessions collected along the Tana basin sites (Tharaka Nithi and Tana River) and Kwale. In addition, an admixture of accessions was reported for accessions from Kwale that showed mixed ancestry from Tharaka Nithi and Tana River. This admixture may be due to genetic exchange between Kwale, Tharaka Nithi and Tana river. These accessions also exhibited reciprocal monophyly based on phylogenetic analysis. This corroborates the phenotypic diversity studies on <italic>H. compressa</italic> where accessions from Kwale exhibited the highest phenotypic diversity compared to other regions (<xref ref-type="bibr" rid="B41">Omire et&#x20;al., 2020b</xref>).</p>
<p>The fixation index (<italic>F</italic>
<sub>
<italic>ST</italic>
</sub>) is an informative method for measuring population differentiation among populations (<xref ref-type="bibr" rid="B38">Nassiry et&#x20;al., 2009</xref>). An overall <italic>F</italic>
<sub>
<italic>ST</italic>
</sub> value of 0.074 was reported for <italic>H. compressa</italic> populations in this study. According to <xref ref-type="bibr" rid="B38">Nassiry et&#x20;al. (2009)</xref>, an <italic>F</italic>
<sub>
<italic>ST</italic>
</sub> of 0&#x2013;0.05 is considered small, 0.05&#x2013;0.15 is moderate and 0.15 and above is considered very high. Therefore, <italic>H. compressa</italic> accessions had moderate genetic differentiation. However, <italic>F</italic>
<sub>
<italic>ST</italic>
</sub>, values obtained from STRUCTURE population clustering indicate high genetic differentiation within cluster 1 (accessions from the northern part of Kenya) than cluster 2 (accessions along the Tana Basin). On the other hand, cluster two had higher levels of heterozygosity (<italic>He</italic>) compared to cluster 1. This indicates high diversity in accessions along the Tana basin. The high heterozygosity and lower genetic differentiation between <italic>H</italic>. <italic>compressa</italic> accessions along the Tana Basin (cluster 2) might be due to genetic exchange arising from gene flow. Although Tharaka Nithi is found approximately 163 and 391 miles away from Tana River and Kwale respectively, gene flow between these three counties seems high. This could be due to the flow of the River Tana (<xref ref-type="fig" rid="F1">Figure&#x20;1</xref>), which traverses both Tharaka and Tana River counties and possibly serves as means of germplasm dispersion. This could explain why Tharaka samples are close to the Tana River accessions on the PCA and the high mixed ancestry as demonstrated by DAPC and STRUCTURE analysis. River Tana is the longest river and the most important drainage basin in Kenya. The river drains from the Kenyan highlands to the Eastern ASAL plateaus and coastal Kenya (<xref ref-type="bibr" rid="B30">Kitheka and Ongwenyi, 2002</xref>). Since <italic>H. compressa</italic> grows in riverine areas, seed dispersal through the river is an important factor influencing the population structure of <italic>H. compressa</italic> at the Kenyan Coast. Seed dispersal is essential for biodiversity conservation by driving plant gene flow, population dynamics and functional connectivity between regions (<xref ref-type="bibr" rid="B49">Traveset and Rodr&#xed;guez-P&#xe9;rez, 2018</xref>). Systematic seed dispersal favours gene flow, increases genetic diversity and lowers the genetic differentiation among populations (<xref ref-type="bibr" rid="B43">Paschoa et&#x20;al., 2018</xref>). Migration rates using MIGRATE-n indicate that there is asymmetrical gene flow along the Tana basin. This supports the hypothesis that seed dispersal along the Tana River drives the population structure of <italic>H. compressa</italic> along the Coast. In addition, high migration rates were observed between Kwale and Tharaka an observation that is confirmed by phylogenetic analysis whereby some Kwale accessions clustered with Tharaka accessions.</p>
<p>There is restricted gene flow into or out of Turkana, which may cause differentiation of its population from the other populations. This was supported by STRUCTURE analysis, PCA, DAPC and neighbor net network, which clustered Turkana distinctly from the rest of the populations. This differentiation may be attributed to the physical distance between Turkana and the other populations. Isolation of Turkana populations inhibits them from mating with the other populations. Turkana is found in the far-flung northern part of Kenya and is considered 100% dryland with scarce rain fed agriculture (<xref ref-type="bibr" rid="B3">Barrow and Mogaka, 2007</xref>). In addition, the selection pressures in Turkana differ from those present in the other regions.</p>
<p>The negative <italic>F</italic>
<sub>
<italic>IS</italic>
</sub> values obtained for <italic>H</italic>. <italic>compressa</italic> populations indicate low levels of inbreeding, high diversity and moderate connectivity between the populations. This may be influenced by the mating system. <italic>Hyphaene compressa</italic> is a dioecious plant (<xref ref-type="bibr" rid="B47">Stauffer et&#x20;al., 2014</xref>), a condition that favors obligate cross pollination which inturn increases intrapopulation genetic diversity (<xref ref-type="bibr" rid="B43">Paschoa et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B37">Muyle et&#x20;al., 2020</xref>). Dioecy is one of the adaptations in plants that promote outbreeding (<xref ref-type="bibr" rid="B7">Charlesworth, 2006</xref>). High genetic diversity and low inbreeding in <italic>H. compressa</italic> was also supported by AMOVA results which showed higher (92.7%) within population diversity than among population diversity (7.3%).</p>
<p>The understanding of the genetic diversity and population structure within <italic>H. compressa</italic> provides useful information for future selection and appropriate conservation strategies. High priority should be given to the conservation of all populations with high genetic diversity. The conservation of <italic>H. compressa</italic> must consider the two identified clusters to ensure that the high diversity within populations is retained. This can be achieved by maximum collection and <italic>ex situ</italic> conservation of germplasm especially for cluster 2 which had the most diversity.</p>
</sec>
<sec sec-type="conclusion" id="s5">
<title>Conclusion</title>
<p>This study was able to show the genetic diversity and population structure of <italic>H. compressa</italic> using the GBS approach. <italic>Hyphaene compressa</italic> in Kenyan ASALs is delineated into two gene pools. Cluster 1 comprising accessions in the north of Kenya while cluster 2 comprising accessions found along the River Tana basin. Further, accessions from the Tana basin are more diverse than those found in the northern part of Kenya. In addition, the results indicate that <italic>H. compressa</italic> accessions are interconnected with high gene flow and moderate genetic differentiation, evidenced by high within-population variation than among population variation. The high within population diversity can be harnessed for future breeding and improvement programs for various adaptive traits in <italic>H. compressa.</italic>
</p>
</sec>
</body>
<back>
<sec id="s6">
<title>Data Availability Statement</title>
<p>The sequence data generated from this study are archived in the NCBI SRA under BioProject accession number PRJNA756042 (<ext-link ext-link-type="uri" xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="https://www.ncbi.nlm.nih.gov/bioproject/PRJNA756042/">https://www.ncbi.nlm.nih.gov/bioproject/PRJNA756042/</ext-link>)</p>
</sec>
<sec id="s7">
<title>Author Contributions</title>
<p>CM, JN, NB, and LW conceived the study, CM, JN, NB, SO, and AO designed the analysis, AO, CM, JN, and NB collected the data, CM, AO, SO, NB, and JN analyzed the data, AO drafted the manuscript with significant contributions from all the authors. All authors contributed to data interpretation and approval of the&#x20;paper.</p>
</sec>
<sec id="s8">
<title>Funding</title>
<p>This work was supported by a grant from The National Research Fund (NRF) Kenya, Grant Number NRF\1\MMC\285.</p>
</sec>
<sec sec-type="COI-statement" id="s9">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s10">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ack>
<p>Special gratitude goes to Kenya Forestry Service, National Museums of Kenya, Nuts and Oil Crops Directorate and Anglican Development Services in Lodwar Kenya for their guidance during sampling.</p>
</ack>
<sec id="s11">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2022.762202/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2022.762202/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material>
<label>Supplementary Figure S1</label>
<caption>
<p>Single Nucleotide Polymorphism (SNP) qualities after filtering the VCF file obtained from <italic>de_novo</italic>-based assembly of GBS data showing the depth per individual. <bold>(A)</bold>, observed heterozygosity <bold>(B)</bold>, Mean depth <bold>(C)</bold> and frequency of missing data per individual <bold>(D)</bold> for <italic>Hyphaene compressa</italic> accessions from Kenya.</p>
</caption>
</supplementary-material>
<supplementary-material>
<label>Supplementary Figure S2</label>
<caption>
<p>Single Nucleotide Polymorphism (SNP) qualities after filtering the VCF file obtained from reference-based assembly of GBS data showing the depth per individual. <bold>(A)</bold>, observed heterozygosity <bold>(B)</bold>, Mean depth <bold>(C)</bold> and frequency of missing data per individual <bold>(D)</bold> for <italic>Hyphaene compressa</italic> accessions from Kenya.</p>
</caption>
</supplementary-material>
<supplementary-material>
<label>Supplementary Figure S3</label>
<caption>
<p>Optimal Delta k values for different k values inferred during STRUCTURE analysis of Kenyan Hyphaene compressa showing the optimal delta k at k &#x003D; 2 for the reference-based assembly <bold>(A)</bold> and the de_novo based assembly <bold>(B)</bold>.</p>
</caption>
</supplementary-material>
<supplementary-material>
<label>Supplementary Figure S4</label>
<caption>
<p>STRUCTURE bar plot of admixture model population assignment of 96 <italic>Hyphaene compressa</italic> accessions from Kenya showing three clusters based on 2096 Single Nucleotide Polymorphisms (SNPs) for the de-novo assembly <bold>(A)</bold> and 23416 SNPs based on reference assembly <bold>(B)</bold>. A combination of different colors represents admixed populations. In these structure plots, Tharaka and Tana River accessions have been placed in one cluster.</p>
</caption>
</supplementary-material>
<supplementary-material>
<label>Supplementary Figure S5</label>
<caption>
<p>Unrooted UPGMA distance tree inferred using 23416 SNPs based on the reference based assembly of <italic>H. compressa</italic> accessions.</p>
</caption>
</supplementary-material>
<supplementary-material>
<label>Supplementary Figure S6</label>
<caption>
<p>Migration rates between Tharaka, Tana River and Kwale using MIGRATE-n software. The direction of the arrow indicate the direction of gene flow.</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="Image3.TIFF" id="SM1" mimetype="application/TIFF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image6.tif" id="SM2" mimetype="application/tif" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image2.TIF" id="SM3" mimetype="application/TIF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image1.TIF" id="SM4" mimetype="application/TIF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image5.png" id="SM5" mimetype="application/png" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table2.DOCX" id="SM6" mimetype="application/DOCX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table1.xlsx" id="SM7" mimetype="application/xlsx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image4.TIFF" id="SM8" mimetype="application/TIFF" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Amwatta</surname>
<given-names>C. J.&#x20;M.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Diversity of Use of Doum (Hyphaene Compressa) in Kenya</article-title>. <source>Palms</source> <volume>48</volume> (<issue>4</issue>), <fpage>184</fpage>&#x2013;<lpage>190</lpage>. </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Andersen</surname>
<given-names>J.&#x20;R.</given-names>
</name>
<name>
<surname>L&#xfc;bberstedt</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Functional Markers in Plants</article-title>. <source>Trends Plant Sci.</source> <volume>8</volume> (<issue>11</issue>), <fpage>554</fpage>&#x2013;<lpage>560</lpage>. <pub-id pub-id-type="doi">10.1016/j.tplants.2003.09.010</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Barrow</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Mogaka</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Kenya&#x2019;s Drylands - Wastelands or an Undervalued National Economic Resource</article-title>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://www.iucn.org/sites/dev/files/import/downloads/kenya_dryland_value_2007.pdf">https://www.iucn.org/sites/dev/files/import/downloads/kenya_dryland_value_2007.pdf</ext-link> (Accessed June 24, 2021)</comment>. </citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bohling</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Evaluating the effect of reference genome divergence on the analysis of empirical RADseq datasets</article-title>. <source>Ecol. Evol.</source> <volume>10</volume>, <fpage>7585</fpage>&#x2013;<lpage>7601</lpage>. <pub-id pub-id-type="doi">10.1002/ece3.6483</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brandies</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Peel</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Hogg</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Belov</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>The Value of Reference Genomes in the Conservation of Threatened Species</article-title>. <source>Genes (Basel)</source> <volume>10</volume>, <fpage>846</fpage>. <pub-id pub-id-type="doi">10.3390/genes10110846</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brunet</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Larson-Rabin</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Stewart</surname>
<given-names>C. M.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>The Distribution of Genetic Diversity within and Among Populations of the Rocky Mountain Columbine: The Impact of Gene Flow, Pollinators, and Mating System</article-title>. <source>Int. J.&#x20;Plant Sci.</source> <volume>173</volume> (<issue>5</issue>), <fpage>484</fpage>&#x2013;<lpage>494</lpage>. <pub-id pub-id-type="doi">10.1086/665263</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Burghardt</surname>
<given-names>L. T.</given-names>
</name>
<name>
<surname>Young</surname>
<given-names>N. D.</given-names>
</name>
<name>
<surname>Tiffin</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>A Guide to Genome-wide Association Mapping in Plants</article-title>. <source>Curr. Protoc. Plant Biol.</source> <volume>2</volume>, <fpage>22</fpage>&#x2013;<lpage>38</lpage>. <pub-id pub-id-type="doi">10.1002/cppb.20041</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Charlesworth</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Evolution of Plant Breeding Systems</article-title>. <source>Curr. Biol.</source> <volume>16</volume> (<issue>17</issue>), <fpage>R726</fpage>&#x2013;<lpage>R735</lpage>. <pub-id pub-id-type="doi">10.1016/j.cub.2006.07.068</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Cosiaux</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Gardiner</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Couvreur</surname>
<given-names>T. L.</given-names>
</name>
</person-group> (<year>2017</year>). <source>Hyphaene Compressa, the IUCN Red List of Threatened Species</source>. <publisher-name>IUCN Red List</publisher-name>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.2305/IUCN.UK.2017-3.RLTS.T95317478A95317481.en">https://doi.org/10.2305/IUCN.UK.2017-3.RLTS.T95317478A95317481.en</ext-link> (Accessed September 2, 2017)</comment>. </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cosiaux</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Gardiner</surname>
<given-names>L. M.</given-names>
</name>
<name>
<surname>Stauffer</surname>
<given-names>F. W.</given-names>
</name>
<name>
<surname>Bachman</surname>
<given-names>S. P.</given-names>
</name>
<name>
<surname>Sonk&#xe9;</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Baker</surname>
<given-names>W. J.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Low Extinction Risk for an Important Plant Resource: Conservation Assessments of continental African Palms (Arecaceae/Palmae)</article-title>. <source>Biol. Conservation</source> <volume>221</volume>, <fpage>323</fpage>&#x2013;<lpage>333</lpage>. <pub-id pub-id-type="doi">10.1016/j.biocon.2018.02.025</pub-id> </citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>D&#x2019;Agostino</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Taranto</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Camposeo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mangini</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Fanelli</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Gadaleta</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>GBS-derived SNP catalogue unveiled wide genetic variability and geographical relationships of Italian olive cultivars</article-title>. <source>Sci. Rep.</source> <volume>10</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1038/s41598-018-34207-y</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Danecek</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Auton</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Abecasis</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Albers</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Banks</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>DePristo</surname>
<given-names>M. A.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>The Variant Call Format and VCFtools</article-title>. <source>Bioinformatics</source> <volume>27</volume> (<issue>15</issue>), <fpage>2156</fpage>&#x2013;<lpage>2158</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btr330</pub-id> </citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Davey</surname>
<given-names>J.&#x20;W.</given-names>
</name>
<name>
<surname>Hohenlohe</surname>
<given-names>P. A.</given-names>
</name>
<name>
<surname>Etter</surname>
<given-names>P. D.</given-names>
</name>
<name>
<surname>Boone</surname>
<given-names>J.&#x20;Q.</given-names>
</name>
<name>
<surname>Catchen</surname>
<given-names>J.&#x20;M.</given-names>
</name>
<name>
<surname>Blaxter</surname>
<given-names>M. L.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Genome-wide Genetic Marker Discovery and Genotyping Using Next-Generation Sequencing</article-title>. <source>Nat. Rev. Genet.</source> <volume>12</volume> (<issue>7</issue>), <fpage>499</fpage>&#x2013;<lpage>510</lpage>. <pub-id pub-id-type="doi">10.1038/nrg3012</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Earl</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>VonHoldt</surname>
<given-names>B. M.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>STRUCTURE HARVESTER: A Website and Program for Visualizing STRUCTURE Output and Implementing the Evanno Method</article-title>. <source>Conservation Genet. Resour.</source> <volume>4</volume>, <fpage>359</fpage>&#x2013;<lpage>361</lpage>. <pub-id pub-id-type="doi">10.1007/s12686-011-9548-7</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Eaton</surname>
<given-names>D. A. R.</given-names>
</name>
<name>
<surname>Overcast</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Ipyrad: Interactive Assembly and Analysis of RADseq Datasets</article-title>. <source>Bioinformatics</source> <volume>36</volume> (<issue>8</issue>), <fpage>2592</fpage>&#x2013;<lpage>2594</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btz966</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Edwards</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Forster</surname>
<given-names>J.&#x20;W.</given-names>
</name>
<name>
<surname>Chagn&#xe9;</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Batley</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2007</year>). &#x201c;<article-title>What Are SNPs</article-title>,&#x201d; in <source>Association Mapping in Plants</source>. Editors <person-group person-group-type="editor">
<name>
<surname>Oraguzie</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Rikkerink</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Gardiner</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>de Silva</surname>
<given-names>H.</given-names>
</name>
</person-group> (<publisher-loc>New York</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>41</fpage>&#x2013;<lpage>52</lpage>. <pub-id pub-id-type="doi">10.1007/978-0-387-36011-9_3</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Elshire</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Glaubitz</surname>
<given-names>J.&#x20;C.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Poland</surname>
<given-names>J.&#x20;A.</given-names>
</name>
<name>
<surname>Kawamoto</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Buckler</surname>
<given-names>E. S.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>A Robust, Simple Genotyping-By-Sequencing (GBS) Approach for High Diversity Species</article-title>. <source>Plos One</source> <volume>6</volume> (<issue>5</issue>), <fpage>e19379</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0019379</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Evanno</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Regnaut</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Goudet</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Detecting the Number of Clusters of Individuals Using the Software STRUCTURE: A Simulation Study</article-title>. <source>Mol. Ecol.</source> <volume>14</volume> (<issue>8</issue>), <fpage>2611</fpage>&#x2013;<lpage>2620</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-294X.2005.02553.x</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Excoffier</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Lischer</surname>
<given-names>H. E. L.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Arlequin Suite Ver 3.5: A New Series of Programs to Perform Population Genetics Analyses under Linux and Windows</article-title>. <source>Mol. Ecol. Resour.</source> <volume>10</volume>, <fpage>564</fpage>&#x2013;<lpage>567</lpage>. <pub-id pub-id-type="doi">10.1111/j.1755-0998.2010.02847.x</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Francis</surname>
<given-names>R. M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Pophelper: an R Package and Web App to Analyse and Visualize Population Structure</article-title>. <source>Mol. Ecol. Resour.</source> <volume>17</volume> (<issue>1</issue>), <fpage>27</fpage>&#x2013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1111/1755-0998.12509</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Galla</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Forsdick</surname>
<given-names>N. J.</given-names>
</name>
<name>
<surname>Brown</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Hoeppner</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Knapp</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Maloney</surname>
<given-names>R. F.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Reference Genomes from Distantly Related Species Can Be Used for Discovery of Single Nucleotide Polymorphisms to Inform Conservation Management</article-title>. <source>Genes</source> <volume>10</volume> (<issue>9</issue>), <fpage>9</fpage>. <pub-id pub-id-type="doi">10.3390/genes10010009</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ganie</surname>
<given-names>S. H.</given-names>
</name>
<name>
<surname>Upadhyay</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Das</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Prasad Sharma</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Authentication of Medicinal Plants by DNA Markers</article-title>. <source>Plant Gene</source> <volume>4</volume>, <fpage>83</fpage>&#x2013;<lpage>99</lpage>. <pub-id pub-id-type="doi">10.1016/j.plgene.2015.10.002</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hazzouri</surname>
<given-names>K. M.</given-names>
</name>
<name>
<surname>Gros-Balthazard</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Flowers</surname>
<given-names>J.&#x20;M.</given-names>
</name>
<name>
<surname>Copetti</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Lemansour</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lebrun</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Genome-wide Association Mapping of Date palm Fruit Traits</article-title>. <source>Nat. Commun.</source> <volume>10</volume>, <fpage>1</fpage>&#x2013;<lpage>14</lpage>. <pub-id pub-id-type="doi">10.1038/s41467-019-12604-9</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>He</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Laroche</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>Z.-X.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Genotyping-by-sequencing (GBS), an Ultimate Marker-Assisted Selection (MAS) Tool to Accelerate Plant Breeding</article-title>. <source>Front. Plant Sci.</source> <volume>5</volume> (<issue>484</issue>), <fpage>1</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.3389/fpls.2014.00484</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huson</surname>
<given-names>D. H.</given-names>
</name>
<name>
<surname>Bryant</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Application of Phylogenetic Networks in Evolutionary Studies</article-title>. <source>Mol. Biol. Evol.</source> <volume>23</volume> (<issue>2</issue>), <fpage>254</fpage>&#x2013;<lpage>267</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msj030</pub-id> </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hyun</surname>
<given-names>D. Y.</given-names>
</name>
<name>
<surname>Sebastin</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>K. J.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>G.-A.</given-names>
</name>
<name>
<surname>Shin</surname>
<given-names>M.-J.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>S. H.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Genotyping-by-Sequencing Derived Single Nucleotide Polymorphisms Provide the First Well-Resolved Phylogeny for the Genus Triticum (Poaceae)</article-title>. <source>Front. Plant Sci.</source> <volume>11</volume> (<issue>688</issue>), <fpage>1</fpage>&#x2013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.3389/fpls.2020.00688</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Johnson</surname>
<given-names>D. L.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>Nomadism and Desertification in Africa and the Middle East</article-title>. <source>GeoJournal</source> <volume>31</volume> (<issue>1</issue>), <fpage>51</fpage>&#x2013;<lpage>66</lpage>. <pub-id pub-id-type="doi">10.1007/bf00815903</pub-id> </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jombart</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Adegenet: a R Package for the Multivariate Analysis of Genetic Markers</article-title>. <source>Bioinformatics</source> <volume>24</volume> (<issue>11</issue>), <fpage>1403</fpage>&#x2013;<lpage>1405</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btn129</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kahn</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Luxereau</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Doum palm Habit and Leaf Collecting Practices in Niger</article-title>. <source>Palms</source> <volume>52</volume> (<issue>1</issue>), <fpage>23</fpage>&#x2013;<lpage>29</lpage>. </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Al-qurainy</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Nadeem</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Biotechnological Approaches for Conservation and Improvement of Rare and Endangered Plants of Saudi Arabia</article-title>. <source>Saudi J.&#x20;Biol. Sci.</source> <volume>19</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>11</lpage>. <pub-id pub-id-type="doi">10.1016/j.sjbs.2011.11.001</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Kigomo</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2001</year>). &#x201c;<article-title>State of forest Genetic Resources in Kenya</article-title>,&#x201d; in <conf-name>Forest Genetic Resources Working Papers FGR/18E; Issue The sub-regional workshop FAO/IPGRI/ICRAF on the conservation, management, sustainable utilization and enhancement of forest genetic resources in Sahelian and North-Sudanian Africa</conf-name>, <conf-loc>Ouagadougou, Burkina Faso</conf-loc>, <conf-date>22-24 September 1998</conf-date>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="http://www.fao.org/3/ab396e/ab396e.pdf">http://www.fao.org/3/ab396e/ab396e.pdf</ext-link>
</comment>. </citation>
</ref>
<ref id="B30">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Kitheka</surname>
<given-names>J.&#x20;U.</given-names>
</name>
<name>
<surname>Ongwenyi</surname>
<given-names>G. S.</given-names>
</name>
</person-group> (<year>2002</year>). &#x201c;<article-title>The Tana River Basin and the Opportunity for Research on the Land-Ocean Interaction in the Tana Delta</article-title>,&#x201d; in <source>Aquadocs</source>. <publisher-loc>Nairobi, Kenya</publisher-loc>: <publisher-name>University of Nairobi</publisher-name>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="http://hdl.handle.net/1834/7842">http://hdl.handle.net/1834/7842</ext-link>
</comment>. </citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Klimova</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ortega-Rubio</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Vendrami</surname>
<given-names>D. L. J.</given-names>
</name>
<name>
<surname>Hoffman</surname>
<given-names>J.&#x20;I.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Genotyping by Sequencing Reveals Contrasting Patterns of Population Structure, Ecologically Mediated Divergence, and Long-Distance Dispersal in North American Palms</article-title>. <source>Ecol. Evol.</source> <volume>8</volume> (<issue>11</issue>), <fpage>5873</fpage>&#x2013;<lpage>5890</lpage>. <pub-id pub-id-type="doi">10.1002/ece3.4125</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Durbin</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Fast and Accurate Short Read Alignment with Burrows-Wheeler Transform</article-title>. <source>Bioinformatics</source> <volume>25</volume> (<issue>14</issue>), <fpage>1754</fpage>&#x2013;<lpage>1760</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp324</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Brock</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Dyer</surname>
<given-names>J.&#x20;M.</given-names>
</name>
<name>
<surname>Kutchan</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Schachtman</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Augustin</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Genetic Diversity and Population Structure of a Camelina Sativa spring Panel</article-title>. <source>Front. Plant Sci.</source> <volume>10</volume> (<issue>February</issue>), <fpage>1</fpage>&#x2013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.3389/fpls.2019.00184</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Maundu</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Tengnas</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2005</year>). &#x201c;<article-title>Useful Trees and Shrubs for Kenya</article-title>,&#x201d; in <source>Technical Handbook Number 35</source> (<publisher-loc>Nairobi, Kenya</publisher-loc>: <publisher-name>World Agroforestry Centre- Eastern and Central Africa Regional Programme</publisher-name>). </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mokhtar</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Adawy</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>El-assal</surname>
<given-names>S. E.-D. S.</given-names>
</name>
<name>
<surname>Hussein</surname>
<given-names>E. H. A.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Genic and Intergenic SSR Database Generation, SNPs Determination and Pathway Annotations, in Date Palm (Phoenix Dactylifera L.)</article-title>. <source>Plos One</source> <volume>11</volume> (<issue>7</issue>), <fpage>e0159268</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0159268</pub-id> </citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Muyle</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Martin</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zemp</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Mollion</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gallina</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Tavares</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Dioecy Is Associated with High Genetic Diversity and Adaptation Rates in the Plant Genus Silene</article-title>. <source>Mol. Biol. Evol.</source> <volume>38</volume> (<issue>3</issue>), <fpage>805</fpage>&#x2013;<lpage>818</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msaa229</pub-id> </citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nassiry</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Javanmard</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Tohidi</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Application of Statistical Procedures for Analysis of Genetic Diversity in Domestic Animal Populations</article-title>. <source>Am. J.&#x20;Anim. Vet. Sci.</source> <volume>4</volume> (<issue>4</issue>), <fpage>136</fpage>&#x2013;<lpage>141</lpage>. <pub-id pub-id-type="doi">10.3844/ajavsp.2009.136.141</pub-id> </citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nkhoma</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Shimelis</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Laing</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Shayanowako</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mathew</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Assessing the Genetic Diversity of Cowpea [Vigna Unguiculata (L.) Walp.] Germplasm Collections Using Phenotypic Traits and SNP Markers</article-title>. <source>BMC Genet.</source> <volume>21</volume> (<issue>110</issue>), <fpage>1</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.1186/s12863-020-00914-7</pub-id> </citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Omire</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Budambula</surname>
<given-names>N. L. M.</given-names>
</name>
<name>
<surname>Neondo</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Gituru</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Mweu</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2020a</year>). <article-title>Phenotypic Diversity of Doum Palm (Hyphaene Compressa), a Semi&#x2010;Domesticated Palm in the Arid and Semi&#x2010;Arid Regions of Kenya</article-title>. <source>Scientifica</source> <volume>2020</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1155/2020/4920830</pub-id> </citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Omire</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Neondo</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Budambula</surname>
<given-names>N. L.</given-names>
</name>
<name>
<surname>Gituru</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Mweu</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2020b</year>). <article-title>Hyphaene Compressa, an Important palm in the Arid and Semi-arid Regions of Kenya</article-title>. <source>Eth Res. Appl.</source> <volume>20</volume>, <fpage>1</fpage>&#x2013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.32859/era.20.4.1-15</pub-id> </citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ortiz</surname>
<given-names>E. M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>vcf2phylipV. 2.0: Convert a VCF Matrix into Several Matrix Formats for Phylogenetic Analysis</article-title>. <pub-id pub-id-type="doi">10.5281/zenodo.2540861</pub-id> </citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Paschoa</surname>
<given-names>R. P. d.</given-names>
</name>
<name>
<surname>Christ</surname>
<given-names>J.&#x20;A.</given-names>
</name>
<name>
<surname>Valente</surname>
<given-names>C. S.</given-names>
</name>
<name>
<surname>Ferreira</surname>
<given-names>M. F. d. S.</given-names>
</name>
<name>
<surname>Miranda</surname>
<given-names>F. D. d.</given-names>
</name>
<name>
<surname>Garbin</surname>
<given-names>M. L.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Genetic Diversity of Populations of the Dioecious Myrsine Coriacea (Primulaceae) in the atlantic forest</article-title>. <source>Acta Bot. Bras.</source> <volume>32</volume>, <fpage>376</fpage>&#x2013;<lpage>385</lpage>. <pub-id pub-id-type="doi">10.1590/0102-33062017abb0355</pub-id> </citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pootakham</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Jomchai</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Ruang-areerate</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Shearman</surname>
<given-names>J.&#x20;R.</given-names>
</name>
<name>
<surname>Sonthirod</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Sangsrakru</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Genome-wide SNP Discovery and Identification of QTL Associated with Agronomic Traits in Oil palm Using Genotyping-By-Sequencing (GBS)</article-title>. <source>Genomics</source> <volume>105</volume> (<issue>5&#x2013;6</issue>), <fpage>288</fpage>&#x2013;<lpage>295</lpage>. <pub-id pub-id-type="doi">10.1016/j.ygeno.2015.02.002</pub-id> </citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pritchard</surname>
<given-names>J.&#x20;K.</given-names>
</name>
<name>
<surname>Stephens</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Donnelly</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Inference of Population Structure Using Multilocus Genotype Data</article-title>. <source>Genetics</source> <volume>155</volume> (<issue>2</issue>), <fpage>945</fpage>&#x2013;<lpage>959</lpage>. <pub-id pub-id-type="doi">10.1007/s10681-008-9788-010.1093/genetics/155.2.945</pub-id> </citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shafer</surname>
<given-names>A. B. A.</given-names>
</name>
<name>
<surname>Peart</surname>
<given-names>C. R.</given-names>
</name>
<name>
<surname>Tusso</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Maayan</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Brelsford</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Wheat</surname>
<given-names>C. W.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Bioinformatic Processing of RAD&#x2010;seq Data Dramatically Impacts Downstream Population Genetic Inference</article-title>. <source>Methods Ecol. Evol.</source> <volume>8</volume>, <fpage>907</fpage>&#x2013;<lpage>917</lpage>. <pub-id pub-id-type="doi">10.1111/2041-210X.12700</pub-id> </citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stauffer</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ouattara</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Stork</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Monocotyledons 2 (Anthericaceae - Palmae)</article-title>. <source>Tropical African Flowering Plants: ecology and distribution</source> <volume>8</volume> (<issue>1</issue>), <fpage>326</fpage>&#x2013;<lpage>354</lpage>. </citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stetter</surname>
<given-names>M. G.</given-names>
</name>
<name>
<surname>Schmid</surname>
<given-names>K. J.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Analysis of phylogenetic relationships and genome size evolution of the Amaranthus genus using GBS indicates the ancestors of an ancient crop</article-title>. <source>Methods Phylogenet. Evol.</source> <volume>109</volume>, <fpage>80</fpage>&#x2013;<lpage>92</lpage>. <pub-id pub-id-type="doi">10.1016/j.ympev.2016.12.029</pub-id> </citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Taranto</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>D&#x2019;Agostino</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Greco</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Cardi</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tripodi</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Genome-wide SNP Discovery and Population Structure Analysis in Pepper (Capsicum Annuum) Using Genotyping by Sequencing</article-title>. <source>BMC Genomics</source> <volume>17</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1186/s12864-016-3297-7</pub-id> </citation>
</ref>
<ref id="B49">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Traveset</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Rodr&#xed;guez-P&#xe9;rez</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2019</year>). &#x201c;<article-title>Seed Dispersal</article-title>,&#x201d; in <source>Encyclopedia of Ecology</source>. Editor <person-group person-group-type="editor">
<name>
<surname>Fath</surname>
<given-names>B.</given-names>
</name>
</person-group>. <edition>2nd ed.</edition> (<publisher-loc>New York</publisher-loc>: <publisher-name>Elsevier</publisher-name>), <fpage>592</fpage>&#x2013;<lpage>599</lpage>. <comment>Issue October 2017</comment>. <pub-id pub-id-type="doi">10.1016/B978-0-12-409548-9.10950-9</pub-id> </citation>
</ref>
<ref id="B36">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Uhl</surname>
<given-names>N. W.</given-names>
</name>
<name>
<surname>Moore</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>palm</article-title>. <source>Encyclopedia Britanica</source>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://www.britannica.com/plant/palm-tree">https://www.britannica.com/plant/palm-tree</ext-link> (Accessed July 27, 2021)</comment>. </citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wallace</surname>
<given-names>J.&#x20;G.</given-names>
</name>
<name>
<surname>Mitchell</surname>
<given-names>S. E.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Genotyping&#x2010;by&#x2010;Sequencing</article-title>. <source>Curr. Protoc. Plant Biol.</source> <volume>2</volume> (<issue>March</issue>), <fpage>64</fpage>&#x2013;<lpage>77</lpage>. <pub-id pub-id-type="doi">10.1002/cppb.20042</pub-id> </citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wickham</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Averick</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bryan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>McGowan</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Fran&#xe7;ois</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Welcome to the Tidyverse</article-title>. <source>Joss</source> <volume>4</volume> (<issue>43</issue>), <fpage>1686</fpage>. <pub-id pub-id-type="doi">10.21105/joss.01686</pub-id> </citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiong</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mou</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Motes</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Genetic Diversity and Population Structure of Cowpea (Vigna Unguiculata L. Walp)</article-title>. <source>PLoS ONE</source> <volume>11</volume> (<issue>8</issue>), <fpage>e0160941</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0160941</pub-id> </citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zheng</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Levine</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Gogarten</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Laurie</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Weir</surname>
<given-names>B. S.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>A High-Performance Computing Toolset for Relatedness and Principal Component Analysis of SNP Data</article-title>. <source>Bioinformatics</source> <volume>28</volume> (<issue>24</issue>), <fpage>3326</fpage>&#x2013;<lpage>3328</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bts606</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>