<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2023.1337736</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Assessing the genetic integrity of sugarcane germplasm in the USDA-ARS National Plant Germplasm System collection using single-dose SNP markers</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Park</surname>
<given-names>Sunchung</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/596985"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zhang</surname>
<given-names>Dapeng</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1081125"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Ali</surname>
<given-names>Gul Shad</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2293640"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Sustainable Perennial Crops Laboratory, United States Department of Agriculture, Agriculture Research Service</institution>, <addr-line>Beltsville, MD</addr-line>, <country>United States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Subtropical Horticulture Research Station, United States Department of Agriculture, Agriculture Research Service</institution>, <addr-line>Miami, FL</addr-line>, <country>United States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Manohar Chakrabarti, The University of Texas Rio Grande Valley, United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Prathima Perumal Thirugnanasambandam, Indian Council of Agricultural Research, Coimbatore, India</p>
<p>Dong-Liang Huang, Guangxi Academy of Agricultural Sciences, China</p>
<p>Avinash Singode, Indian Council of Agricultural Research (ICAR), India</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Gul Shad Ali, <email xlink:href="mailto:Gul.Ali@usda.gov">Gul.Ali@usda.gov</email>; Dapeng Zhang, <email xlink:href="mailto:dapeng.zhang@usda.gov">dapeng.zhang@usda.gov</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>04</day>
<month>01</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>14</volume>
<elocation-id>1337736</elocation-id>
<history>
<date date-type="received">
<day>13</day>
<month>11</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>15</day>
<month>12</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Park, Zhang and Ali</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Park, Zhang and Ali</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>The World Collection of Sugarcane and Related Grasses, maintained at the USDA-ARS in Miami, FL, is one of the largest sugarcane germplasm repositories in the world. However, the genetic integrity of the <italic>Saccharum</italic> spp. germplasm in this collection has not been fully analyzed. In this study, we employed a single-dose SNP panel to genotype 901 sugarcane accessions, representing six <italic>Saccharum</italic> species and various hybrids. Our analysis uncovered a high rate of clone mislabeling in the collection. Specifically, we identified 86 groups of duplicates, characterized by identical SNP genotypes, which encompassed 211 accessions (23% of the total clones), while 135 groups, constituting 471 clones (52% of the total), exhibited near-identical genotypes. In addition, twenty-seven homonymous groups were detected, which shared the same clone name but differed in SNP genotypes. Hierarchical analysis of population structure partitioned the <italic>Saccharum</italic> germplasm into five clusters, corresponding to <italic>S. barberi, S. sinense, S. officinarum, S. spontaneum</italic> and <italic>S. robustum/S. edule</italic>. An assignment test, based on the five <italic>Saccharum</italic> species, enabled correcting 141 instances of mislabeled species memberships and inaccuracies. Moreover, we clarified the species membership and parentage of 298 clones that had ambiguous passport records (e.g., &#x2018;<italic>Saccharum spp</italic>&#x2019;, &#x2018;unknown&#x2019;, and &#x2018;hybrid&#x2019;). Population structure and genetic diversity in these five species were further supported by Principal Coordinate Analysis and neighbor-joining clustering analysis. Analysis of Molecular Variance revealed that within-species genetic variations accounted for 85% of the total molecular variance, with the remaining 15% attributed to among-species genetic variations. The single-dose SNP markers developed in this study offer a robust tool for characterizing sugarcane germplasm worldwide. These findings have important implications for sugarcane genebank management, germplasm exchange, and crop genetic improvement.</p>
</abstract>
<kwd-group>
<kwd>
<italic>Saccharum</italic>
</kwd>
<kwd>germplasm</kwd>
<kwd>sugarcane</kwd>
<kwd>genetic diversity</kwd>
<kwd>population structure</kwd>
</kwd-group>
<counts>
<fig-count count="6"/>
<table-count count="5"/>
<equation-count count="0"/>
<ref-count count="56"/>
<page-count count="14"/>
<word-count count="8121"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Plant Genetics, Epigenetics and Chromosome Biology</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Sugarcane (<italic>Saccharum</italic> spp.) is a prolific energy crop that serves as a substantial source of sugar, biofuel, and other industrial chemicals (<xref ref-type="bibr" rid="B14">Formann et&#xa0;al., 2020</xref>). It is cultivated worldwide in over 95 countries across 26.4 million hectares, with a total production of 1.86 billion metric tons and a gross production value of $96.5 billion dollars (<xref ref-type="bibr" rid="B12">FAO, 2023</xref>). Sugarcane plays a crucial role in the economies of many tropical and subtropical countries, meeting nearly 80% of global sugar demands for food consumption and accounting for approximately 40% of the world&#x2019;s bioethanol needs (<xref ref-type="bibr" rid="B26">Lam et&#xa0;al., 2009</xref>). Furthermore, lignocellulosic biomass derived from sugarcane and energy cane is recognized as a promising feedstock for biofuel production. As the demand for sugar and biofuel continues to rise, a challenge for sugarcane breeding programs is to develop improved varieties with higher yield, sucrose content, disease resistance, improved ratooning ability and adaptability to environmental stresses. Genetic diversity is crucial in developing such varieties to unlock the full potential of sugarcane as a feedstock for both sugar and fiber production. (<xref ref-type="bibr" rid="B26">Lam et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B21">Hoang et&#xa0;al., 2015</xref>).Sugarcane species belong to the grass family <italic>Poacea</italic>, genus <italic>Saccharum</italic>, and share genetic similarities with <italic>Sorghum</italic> and other grasses (<xref ref-type="bibr" rid="B44">Spangler et&#xa0;al., 1999</xref>). Within the <italic>Saccharum</italic> genus, six main species are recognized: two wild species, <italic>S. spontaneum</italic> (2<italic>n</italic> = 40 -128, <italic>x</italic> = 8) and <italic>S. robustum</italic> (2<italic>n</italic> = 60 &#x2013; 80), and four cultivated species, <italic>S. officinarum</italic> (2<italic>n</italic> = 80, <italic>x</italic> =10), <italic>S. barberi</italic> (2<italic>n</italic> = 81 -124), <italic>S. sinense</italic> (2<italic>n</italic> = 111 &#x2013; 120), and <italic>S. edule</italic> (2<italic>n</italic> = 60, 70, 80) (<xref ref-type="bibr" rid="B31">Moore et&#xa0;al., 2013</xref>). Genetic studies suggest that <italic>S. officinarum</italic> and <italic>S. edule</italic> originated from <italic>S. robustum</italic> (<xref ref-type="bibr" rid="B17">Grivet et&#xa0;al., 2004</xref>; <xref ref-type="bibr" rid="B18">Grivet et&#xa0;al., 2006</xref>) and that <italic>S. sinense</italic> and <italic>S. barberi</italic> are interspecific hybrids resulting from a cross between <italic>S. officinarum</italic> an <italic>S. spontaneum</italic>, with 32 -39% of their genomes derived from <italic>S. spontaneum</italic> (<xref ref-type="bibr" rid="B7">D&#x2019;Hont et&#xa0;al., 1996</xref>; <xref ref-type="bibr" rid="B36">Piperidis et&#xa0;al., 2010</xref>). Most modern sugarcane cultivars are complex polyploids (<italic>2n = 4x</italic> to 12<italic>x</italic>, totaling 100 &#x2013; 128 chromosomes), resulting from interspecific crosses between sugar-rich <italic>S. officinarum</italic> and <italic>S. spontaneum</italic> with disease resistance, vigor and other agronomic traits (<xref ref-type="bibr" rid="B36">Piperidis et&#xa0;al., 2010</xref>).</p>
<p>Since the early 1970s, sugarcane productivity has steadily increased, largely attributed to improved varieties and agronomic practices (<xref ref-type="bibr" rid="B31">Moore et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B19">Hale et&#xa0;al., 2022</xref>). However, the sugarcane industry faces challenges posed by diseases, pests, adaptability to different soil types, water availability and environmental stresses, underscoring the need for the development of new and resilient sugarcane varieties with high sucrose content. The current repertoire of modern sugarcane cultivars is the result of crosses made in the early 1900s, involving fewer than 20 <italic>S. officinarum</italic> and <italic>S. spontaneum</italic> clones as parents (<xref ref-type="bibr" rid="B6">Deren, 1995</xref>; <xref ref-type="bibr" rid="B40">Raboin et&#xa0;al., 2006</xref>), essentially resulting in a monoculture of a few dominant sugarcane varieties grown across large geographic areas, and making them vulnerable to disease and pest outbreaks. To enhance the resilience of sugarcane varieties, it is important to increase the genetic diversity of sugarcane germplasm. Recognizing the importance of landraces and wild relatives as sources of novel genetic traits, efforts for enhancing genetic diversity should be focused on introgression of genes from landraces, wild species within <italic>Saccharum</italic> species complex, and crossable wild relatives such as <italic>Miscanthus</italic> and <italic>Tripidium</italic>. The World Collection of Sugarcanes and Related Grasses (WCSRG), maintained by the United States Department of Agriculture (USDA), Agriculture Research Service (ARS), Subtropical Horticulture Research Station (SHRS), serves as a repository for one of the world largest collections of sugarcane and its wild relatives, originating from various geographical regions. This collection has been used in breeding programs and biological studies to improve sugarcane varieties (<xref ref-type="bibr" rid="B32">Nayak et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B55">Zhang et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B52">You et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B13">Fickett et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B19">Hale et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B46">Wang et&#xa0;al., 2022</xref>). Moreover, as a USDA National Plant Germplasm collection, the clones are freely distributed to international sugarcane community. From 2010 to 2021, a total of 9439 cuttings of various <italic>Saccharum</italic> spp., and 298 cuttings of 4 <italic>Tripidium</italic> spp., were distributed to researchers and breeders in the USA (44%) and internationally (56%) (<xref ref-type="bibr" rid="B20">Hemaprabha et&#xa0;al., 2022</xref>).</p>
<p>The WCSRG currently houses approximately 1164 accessions, the majority of which belong to <italic>Saccharum</italic> spp, including 307 <italic>S. spontaneum</italic> accessions, 158 <italic>S. officinarum</italic> accessions, 127 <italic>S. hybrid</italic> accessions, 81 <italic>S. robustum</italic> accessions, 48 <italic>S. sinense</italic> accessions, and 33 <italic>S. barberi</italic> accessions. These accessions originated from various geoclimatic regions and likely harbor genes for adaptation to different climatic stresses, pests, and diseases. Ample information on genetic diversity and population structure within this collection has been generated using molecular markers (<xref ref-type="bibr" rid="B4">Brown et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B32">Nayak et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B13">Fickett et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B49">Xiong et&#xa0;al., 2022</xref>) and candidate genes (<xref ref-type="bibr" rid="B33">Parco et&#xa0;al., 2017</xref>). Based on simple sequence repeat (SSR) genotyping results, a core collection including 300 accessions was proposed (<xref ref-type="bibr" rid="B32">Nayak et&#xa0;al., 2014</xref>). Furthermore, target enrichment sequencing was performed on 307 germplasm accessions from this collection, leading to the identification of ancestor of ancient and modern hybrids in <italic>Saccharum</italic> spp. (<xref ref-type="bibr" rid="B51">Yang et&#xa0;al., 2019</xref>). Based on the sequencing data, a genome-wide association study was performed on this diversity panel and candidate genes for agronomic traits and disease resistance were identified (<xref ref-type="bibr" rid="B51">Yang et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B50">Yang et&#xa0;al., 2020</xref>).</p>
<p>Despite the progress achieved in the molecular characterization of the WCSRG, genetic integrity of the sugarcane germplasm maintained in this collection has not been systematically analyzed. This is mainly because accurate identification of sugarcane germplasm has been technically challenging, due to the high polyploidy (and aneuploidy) nature of this crop (<xref ref-type="bibr" rid="B4">Brown et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B42">Song et&#xa0;al., 2016</xref>). For any given locus in sugarcane, there can be 8 to 12 alleles in different configurations, which ambiguates genotype identification. Therefore, single-dose molecular markers are needed to distinguish among sugarcane genotypes with complex allele configurations (<xref ref-type="bibr" rid="B42">Song et&#xa0;al., 2016</xref>). Recently, <xref ref-type="bibr" rid="B52">You et&#xa0;al. (2019)</xref> reported the target enrichment sequencing of 300 sugarcane accessions selected from the world collection and developed an Affymetrix Axiom 100K SNP array. This array, which comprises 31,449 single-dose SNPs and 68,648 low-dosage SNPs, provides a powerful tool for using single-dose SNPs in sugarcane germplasm identification.</p>
<p>In this study, we selected 2000 single-dose SNP markers from the Affymetrix Axiom SNP array (<xref ref-type="bibr" rid="B52">You et&#xa0;al., 2019</xref>). After validating the selected candidate SNPs in a pilot study, we selected the final genotyping panel and used it to genotype all the <italic>Saccharum</italic> germplasm, including six <italic>Saccharum</italic> species and hybrids. Through comprehensive genotyping and population structure analyses, we assessed genetic integrity, population structure, and genetic diversity in <italic>Saccharum</italic> germplasm. We identified a high rate of clone mislabeling and redundancy within the sugarcane germplasm collection, characterized by clone duplicate errors, homonymous off-types, and mistakes in species memberships. Moreover, our analyses of population structure and genetic diversity revealed novel insights into the classification and inter-relationships of <italic>Saccharum</italic> species. Overall, these findings provide valuable information for sugarcane research community to improve the accuracy and efficiency of managing and utilizing the sugarcane genetic resources in the WCSRG.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Plant materials</title>
<p>The sugarcane accessions reported in this study are part of the WCSRG, which is curated by the USDA-ARS, SHRS, in Miami, FL. <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref> provides a summary of the geographical distribution of the germplasm accessions. A detailed list of all accessions is provided in <xref ref-type="supplementary-material" rid="SM1">
<bold>Table S1</bold>
</xref>. The S. spontaneum accessions are maintained in 7-gallon pots on a concrete pad and not allowed to flower as they are considered invasive. The rest of the accessions are planted in the field and rotated to new field plots every 4 years. The mature plants are cut to the ground every year in the early spring until replanting. The species name of each accession in the WCSRG was defined based on the curator&#x2019;s naming system.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>The Geographical origin of 901 <italic>Saccharum</italic> germplasm accessions analyzed in the present study, including <italic>S. spontaneum</italic> (283), <italic>S. robustum</italic> (76), <italic>S. officinarum</italic> (158), <italic>S. barberi</italic> (32), <italic>S. sinense</italic> (46), <italic>S. edule</italic> (3), <italic>Saccharum</italic> spp. (175), Unknown (3), hybrid (123). A detailed list with passport information is presented in <xref ref-type="supplementary-material" rid="SM1">
<bold>Table S1</bold>
</xref>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1337736-g001.tif"/>
</fig>
<p>From each sugarcane plant, one fully expanded young leaf was collected into labeled paper envelopes. A total of eight leaf disks were collected using the BioArk Leaf kit provided by LGC, Biosearch Technologies (<ext-link ext-link-type="uri" xlink:href="https://www.biosearchtech.com/">https://www.biosearchtech.com/</ext-link>). The prepared BioArk Leaf kits were then submitted to LGC Genomics (Middleton, WI) for DNA extraction and subsequent genotyping.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>SNP markers, Genotyping and SNP calling</title>
<p>The single-dose markers were initially selected from the Axiom Sugarcane 100K SNP array, which was developed based on five <italic>Saccharum</italic> species (<italic>S. sinense</italic>, <italic>S. barberi</italic>, <italic>S. robustum</italic>, <italic>S. officinarum</italic>, and <italic>S. spontaneum</italic>) and 37 sugarcane hybrids (<xref ref-type="bibr" rid="B52">You et&#xa0;al., 2019</xref>). A set of two thousand bi-allelic and single-dose SNPs were randomly selected from the Axiom Sugarcane 100K SNP array. Probes targeting these SNPs were designed by Biosearch Technologies (<ext-link ext-link-type="uri" xlink:href="https://www.biosearchtech.com">https://www.biosearchtech.com</ext-link>) and used to amplify sugarcane genome DNA libraries, which were then sequenced using the 1x 75 bp Illumina sequencing platform. Reads were trimmed by removing the first 40 bases and quality-checked with a Q value &gt;20. The 2000 candidate SNPs were first evaluated in a pilot study using 196 sugarcane germplasm accessions (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S1</bold>
</xref>). Based on call rate, Minor Allele Frequency (MAF), and Linkage Disequilibrium (LD), we then selected a low-density genotyping panel including 400 SNPs and used it to genotype all the <italic>Saccharum</italic> clones including six <italic>Saccharum</italic> species and inter-specific hybrids.</p>
<p>The genotyping was performed using a targeted genotyping-by-sequencing approach called SeqSNP, which has been successfully used in several crops (<xref ref-type="bibr" rid="B54">Zhang et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B22">Jo et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B56">Ziarsolo et&#xa0;al., 2021</xref>). Sequence reads were aligned to the sequences (300bp) flanking the SNP markers, using Bowtie2 (version 2.4.5) (<xref ref-type="bibr" rid="B27">Langmead and Salzberg, 2012</xref>). The subsequent alignments (BAM files) were used to call SNP variants by the freebayes program (version 1.1.0) (<xref ref-type="bibr" rid="B15">Garrison and Marth, 2012</xref>) with the following parameters: min-quality 20, &#x2013;min-supporting-allele-qsum 10; &#x2013;read-mismatch-limit 4; &#x2013;mismatch-base-quality-threshold 10; &#x2013;exclude-unobserved-genotypes; &#x2013;no-mnps; &#x2013;no-complex; &#x2013;ploidy 4; &#x2013;min-alternate-fraction.08333; &#x2013;legacy-gls. The called SNP variants (VCF files) were further filtered using the following criteria: 1) SNPs must be biallelic; 2) SNPs must be supported by at least 20 reads, otherwise, they were marked as missing genotypes; 3) both alternative and reference alleles must each be supported by at least 2 reads. After the initial filtering, informative SNPs were selected by excluding SNPs with a missing rate of 10% and a minor allele frequency of &lt;5%. Additionally, samples with 10% or more missing SNP genotyping were also excluded. These filtering processes resulted in a dataset of 357 SNPs and 901 samples for downstream analyses. To assess the degree of variation among SNP markers, genetic parameters such as minor allele frequency (MAF), expected heterozygosity (H<sub>exp</sub>), and observed heterozygosity (H<sub>obs</sub>) for each SNP marker were measured using the R-package snpReady (version 0.9.6) (<xref ref-type="bibr" rid="B16">Granato et&#xa0;al., 2018</xref>).</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Clone mislabeling and genetic redundancy</title>
<p>For this study, we defined three types of problems related to genetic integrity of sugarcane germplasm. The first type was synonymous mislabeling or &#x201c;duplicate error,&#x201d; meaning that sugarcane clones had different names but shared the same SNP genotype. The second was homonymous mislabeling, meaning that individual clones had the same name in this collection, but they had different SNP genotypes. The third type was mistakes, inaccuracies, or a lack of information in species classification, where the species membership of a given clone was wrongfully recorded (<xref ref-type="bibr" rid="B4">Brown et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B51">Yang et&#xa0;al., 2019</xref>).</p>
<p>To identify synonymous mislabeling among sugarcane clones, the allele difference between each pair of individuals was computed using the R-package poppr (<xref ref-type="bibr" rid="B24">Kamvar et&#xa0;al., 2014</xref>). Individuals with zero allele difference at all loci were considered duplicates. The groups of duplicates were visually inspected by constructing a network graph using the R-packages of network and ggplot2. Since genotyping errors are not uncommon, a pair of clones that differ by one or two loci could be the same clone (<xref ref-type="bibr" rid="B23">Kalinowski et&#xa0;al., 2006</xref>; <xref ref-type="bibr" rid="B53">Zhang et&#xa0;al., 2006</xref>). To assess potential genotyping error, we included 12 sugarcane samples in genotyping. These 12 samples were propagated from a single clone &#x201c;P-Mag-84-2&#x201d; (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S1</bold>
</xref>) and served as an internal control. Mismatched SNP loci among these 12 samples were calculated and used as a baseline to determine the &#x201c;mismatch threshold&#x201d; for clone identification. Any pair of samples that had mismatched loci below the threshold (near-identical genotypes) were considered as putative duplicates (<xref ref-type="bibr" rid="B53">Zhang et&#xa0;al., 2006</xref>; <xref ref-type="bibr" rid="B2">Akpertey et&#xa0;al., 2021</xref>).</p>
<p>The statistical rigor of duplicate identification was assessed using the probability of identity that two individuals may share the same multilocus genotype by chance (<xref ref-type="bibr" rid="B45">Waits et&#xa0;al., 2001</xref>). The computer program GenAlEx 6.5 (<xref ref-type="bibr" rid="B34">Peakall and Smouse, 2006</xref>; <xref ref-type="bibr" rid="B35">Peakall and Smouse, 2012</xref>) was used to calculate the probability of identity among siblings (PIDsib). PIDsib is defined as the probability that two sibling individuals drawn at random from a population have the same mutilocus genotype (<xref ref-type="bibr" rid="B45">Waits et&#xa0;al., 2001</xref>).</p>
<p>To identify homonymous mislabeling, SNP genotypes of the clones with the same name were manually grouped and compared using multi-locus matching. If the clones differ by more than two loci, then these clones were considered to have different SNP genotypes thus were claimed as homonymous mislabeling.</p>
<p>To identify clones with mistake in species membership, assignment test based on Bayesian clustering analysis of population structure (<xref ref-type="bibr" rid="B38">Pritchard et&#xa0;al., 2000</xref>) was used. Clones with wrongfully assigned species membership were detected and corrected based on the assignment result (see the next section).</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Population structure and genetic diversity</title>
<p>To assess population structure in the collection, we only used accessions with explicit species names recorded in the passport data. Clones recorded as &#x2018;Hybrid&#x2019; or &#x2018;Unknown&#x2019; were excluded in this stage, which led to the retention of 591clones for the population structure analysis. The computer program STRUCTURE ver. 2.3.4 (<xref ref-type="bibr" rid="B38">Pritchard et&#xa0;al., 2000</xref>) was used. The program was run at 10 independent repetitions for population numbers ranging from K = 1 to K = 10, with a burn-in period of 50,000 and 100,000 Markov chain Monte Carlo (MCMC). The optimal number of model components (K) was determined based on delta K (<xref ref-type="bibr" rid="B10">Evanno et&#xa0;al., 2005</xref>). Based on the result, iterative runs were performed on each partitioned cluster to explore the sub-structures within each cluster, as recommended by <xref ref-type="bibr" rid="B10">Evanno et&#xa0;al. (2005)</xref>. Ancestry and admixture proportions were visualized using computer program CLUMPAK (<xref ref-type="bibr" rid="B25">Kopelman et&#xa0;al., 2015</xref>).</p>
<p>Based on the result of the STRUCTURE analysis, clones with the assignment coefficient above 0.80 (Q value &gt;0.80) were considered core members of each cluster and retained for subsequent genetic diversity analysis, including computation of F statistics, Analysis of Molecular Variance (AMOVA), Principal Coordinate Analysis and Neighbor-Joining Clustering Analysis.</p>
<p>AMOVA was performed using the program GenAlex 6.5 (<xref ref-type="bibr" rid="B34">Peakall and Smouse, 2006</xref>; <xref ref-type="bibr" rid="B35">Peakall and Smouse, 2012</xref>). The significance of fixation index (F<sub>ST</sub>) was tested using 999 random permutations. In addition, the F<sub>ST</sub> for each pair of core germplasm groups was calculated and the statistical significance was tested using permutations with the program GenAlEx 6.5.</p>
<p>Key summary statistics including gene diversity (H<sub>exp</sub>) and observed heterozygosity (H<sub>obs</sub>) were calculated for each species using the program GenAlEx 6.5 (<xref ref-type="bibr" rid="B34">Peakall and Smouse, 2006</xref>; <xref ref-type="bibr" rid="B35">Peakall and Smouse, 2012</xref>). To illustrate genetic relationships among the species, a distance-based multivariate analysis was performed. Pairwise genetic distances were computed using the Distance option, and Principal Coordinates Analysis (PCoA) within the GenAlEx 6.5 program. The PCoA results are presented as two-axis PCO plots, and both plots axis 1 vs 2 and axis 1 vs 3 are presented separately.</p>
<p>To further examine the genetic relationship among different species, a neighbor-joining (NJ) clustering analysis was performed. The NJ tree was constructed based on the SNP genotype data using the R-package poppr (<xref ref-type="bibr" rid="B24">Kamvar et&#xa0;al., 2014</xref>). Pairwise genetic distances between the sugarcane clones were estimated and the neighbor-joining method was used to construct the tree. The final tree was visualized using FigTree version1.4.4 (<ext-link ext-link-type="uri" xlink:href="http://tree.bio.ed.ac.uk/software/figtree">http://tree.bio.ed.ac.uk/software/figtree</ext-link>).</p>
<p>To assess species membership and parentage for clones recorded as &#x2018;hybrid&#x2019; or &#x2018;unknown&#x2019;, we used the core members of the five <italic>Saccharum</italic> species as references and increased their samples size to 500 for each species, using the Simulation procedure implemented in the computer program ONCOR (<ext-link ext-link-type="uri" xlink:href="https://www.montana.edu/kalinowski/software/oncor.html">https://www.montana.edu/kalinowski/software/oncor.html</ext-link>). The simulated populations were then analyzed together with the 298 clones with unclarified species membership (clones labeled as &#x2018;unknown&#x2019; or &#x2018;hybrid&#x2019;) using STRUCTURE 2.3.4. An admixed model was selected, and the number of clusters (K value) was set to five, corresponding to the five <italic>Saccharum</italic> species. Ten independent runs were conducted at K = 5, each consisting of 100,000 iterations after a burn-in period of 50,000 iterations. From the 10 independent runs, the mean membership score was presented as the inferred species/parentage or species membership.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Genotyping with SNP markers</title>
<p>After applying an initial filtering process to exclude SNPs and samples with a missing rate of 10% or greater, a total of 751 SNP markers and 901 clones were obtained. Among the <italic>Saccharum</italic> clones, there were 286 <italic>S. spontaneum</italic>, 175 unknown, 158 <italic>S. officinarum</italic>, 123 hybrids, 76 <italic>S. robustum</italic>, 46 <italic>S. sinense</italic>, 32 <italic>S. barberi</italic>, 3 <italic>S. edule</italic>, 1 <italic>S. narenga</italic>, 1 <italic>S. arundinaceum</italic>, as recorded in passport data (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S1</bold>
</xref>). Of the SNPs, 217 (29%) were found to be monomorphic. To obtain informative SNP markers, we further filtered out SNPs with a minor allele frequency of less than 5%, resulting in a final set of 357 markers. The final genotype data for these markers showed an average missing rate of 0.15%, ranging from 0 to 7.6%. The sugarcane clones, on the other hand, showed an average missing rate of 0.15%, ranging from 0 to 6.2%. Among the 357 SNP markers, the expected heterozygosity ranged from 0.09 to 0.5, with an average of 0.23. The observed heterozygosity ranged from 0.09 to 0.99 with an average of 0.3. Additionally, the minor allele frequency ranged from 0.05 to 0.5 with an average of 0.153 (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S2</bold>
</xref>).</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Clone mislabeling and genetic redundancy in the collection</title>
<p>Clonal propagation and field maintenance of sugarcane germplasm plants can often lead to mislabeling and name loss. The WCSRG, which houses collections from diverse locations worldwide, often encounters duplicated accessions with different regional names but identical clones. To estimate mislabeling and clonal redundancy, we measured the allele difference distance between each pair of sugarcane accessions at all SNP loci. Synonymous groups (duplicates) were determined when clones shared the same alleles at all SNP loci. Our analysis revealed 86 groups of duplicates comprising 211 accessions (23% of the examined <italic>Saccharum</italic> clones), demonstrating a high rate of synonymous mislabeling and genetic redundancy within the collection (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>). The number of duplicated clones within each group ranged from two to nine clones, with 67 groups consisting of two clones (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Table S3</bold>
</xref>).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>A network representing the genetic relationships among sugarcane clones based on allele difference at the SNP loci. The network was constructed with clones with zero allele difference (identical genotype) where nodes represent clones, and the connections indicate identical genotype between the clones.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1337736-g002.tif"/>
</fig>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Examples of the identified synonymous mislabeling groups (duplicates) in the <italic>Saccharum</italic> germplasm maintained in the WCSRG.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Group</th>
<th valign="middle" align="left">Clone code</th>
<th valign="middle" align="left">Species</th>
<th valign="middle" align="left">Clone Name</th>
<th valign="middle" align="left">Source of introduction</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="9" align="center">2</td>
<td valign="middle" align="left">SAC0472</td>
<td valign="middle" align="left">
<italic>S. sinense</italic>
</td>
<td valign="middle" align="left">UBA NAQUIN</td>
<td valign="middle" align="left">US</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0513</td>
<td valign="middle" align="left">
<italic>S. sinense</italic>
</td>
<td valign="middle" align="left">NEPAL 3</td>
<td valign="middle" align="left">Nepal</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0518</td>
<td valign="middle" align="left">
<italic>S. sinense</italic>
</td>
<td valign="middle" align="left">CHINA</td>
<td valign="middle" align="left">South Africa</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0519</td>
<td valign="middle" align="left">
<italic>S. sinense</italic>
</td>
<td valign="middle" align="left">AGAUL</td>
<td valign="middle" align="left">South Africa</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0531</td>
<td valign="middle" align="left">
<italic>S. sinense</italic>
</td>
<td valign="middle" align="left">TANZHOU</td>
<td valign="middle" align="left">china</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0616</td>
<td valign="middle" align="left">
<italic>S. sinense</italic>
</td>
<td valign="middle" align="left">MCILKRUM</td>
<td valign="middle" align="left">US</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0670</td>
<td valign="middle" align="left">
<italic>S. barberi</italic>
</td>
<td valign="middle" align="left">Kinar</td>
<td valign="middle" align="left">India</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0711</td>
<td valign="middle" align="left">
<italic>S. sinense</italic>
</td>
<td valign="middle" align="left">Uba Striped</td>
<td valign="middle" align="left">Unknown</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0760</td>
<td valign="middle" align="left">
<italic>S. sinense</italic>
</td>
<td valign="middle" align="left">Cayana 10</td>
<td valign="middle" align="left">Unknown</td>
</tr>
<tr>
<td valign="middle" rowspan="6" align="center">3</td>
<td valign="middle" align="left">SAC0321</td>
<td valign="middle" align="left">
<italic>S. robustum</italic>
</td>
<td valign="middle" align="left">IN 84-045</td>
<td valign="middle" align="left">Barbados</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0425</td>
<td valign="middle" align="left">
<italic>S. barberi</italic>
</td>
<td valign="middle" align="left">MESANGEN</td>
<td valign="middle" align="left">Guyana</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0426</td>
<td valign="middle" align="left">
<italic>S. robustum</italic>
</td>
<td valign="middle" align="left">IN 84-045</td>
<td valign="middle" align="left">Barbados</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0458</td>
<td valign="middle" align="left">
<italic>S. officinarum</italic>
</td>
<td valign="middle" align="left">HORNE</td>
<td valign="middle" align="left">Barbados</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0461</td>
<td valign="middle" align="left">
<italic>S. robustum</italic>
</td>
<td valign="middle" align="left">NG 28-251</td>
<td valign="middle" align="left">Guadeloupe</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0476</td>
<td valign="middle" align="left">unknown</td>
<td valign="middle" align="left">UNKNOWN</td>
<td valign="middle" align="left">Unknown</td>
</tr>
<tr>
<td valign="middle" rowspan="4" align="center">4</td>
<td valign="middle" align="left">SAC0323</td>
<td valign="middle" align="left">
<italic>S. officinarum</italic>
</td>
<td valign="middle" align="left">NG 28-014 (SS 58-08)</td>
<td valign="middle" align="left">Papua New Guinea</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0436</td>
<td valign="middle" align="left">
<italic>S. robustum</italic>
</td>
<td valign="middle" align="left">NG 57-208</td>
<td valign="middle" align="left">US</td>
</tr>
<tr>
<td valign="middle" align="left">SAC0447</td>
<td valign="middle" align="left">
<italic>S. robustum</italic>
</td>
<td valign="middle" align="left">NG 57-208</td>
<td valign="middle" align="left">US</td>
</tr>
<tr>
<td valign="middle" align="left">SAC1234</td>
<td valign="middle" align="left">
<italic>S. robustum</italic>
</td>
<td valign="middle" align="left">NG 57-208</td>
<td valign="middle" align="left">US</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>The full list of identified duplicates and near-identical genotypes (clones differing by one or two alleles) was listed in <xref ref-type="supplementary-material" rid="SM1">
<bold>Table S3</bold>
</xref> and <xref ref-type="supplementary-material" rid="SM1">
<bold>S4</bold>
</xref>.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>To estimate genotyping error, twelve clonal samples propagated from a single clone of &#x2018;P-Mag-84-2&#x2019; were included as an internal control. Of the 12 samples, however, only eight samples (Group1 in the <xref ref-type="supplementary-material" rid="SM1">
<bold>Table S3</bold>
</xref>) were identified as duplicates with zero allele difference, while three samples showed one allele difference, and one sample showed two allele differences. These differences were attributed to likely genotyping errors at four loci. Assuming no mutation in the clonal plants, these results indicated an error rate of 0.093% in our genotyping, as four loci were called wrongly out of a total of 4,284 loci in the 12 clonal samples. Based on the observed error rate, we relaxed the threshold of detecting duplicates. Any pair of samples that had up to two allele differences were considered putative duplicates. Based on this relaxed threshold, we identified 135 groups consisting of 471 clones (52% of the total clones) as putative duplicates. The number of duplicated clones within each group ranged from 2 to 38 (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S4</bold>
</xref>).</p>
<p>The result of duplicate identification was supported by the probability of identity among siblings (PID-sib). The cumulative PID-sib of the first 48 SNPs ranged from 3.85E-04 (<italic>S. robustum</italic>) to 6.73E-07 (<italic>S. officinarum</italic>), which demonstrated that a high level of statistical power can be achieved in sugarcane germplasm analysis using only a small fraction of the 357 SNP markers (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S5</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S1</bold>
</xref>). When all 357 SNP loci were included, the cumulative PID-sib ranged from 2.4E-20 (<italic>S. robustum</italic>) to 7.6E-42 (<italic>S. officinarum</italic>), which indicates that there is almost a null probability of finding two individual clones with the same genotype within any of the five <italic>Saccharum</italic> species.</p>
<p>To identify homonymous mislabeling, clones with the same name were compared for their SNP genotypes using multi-locus matching. A total of 27 homonymous mislabeling groups were detected in all the studied <italic>Saccharum</italic> species, except <italic>S. edule</italic> (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). Most of the identified homonymous groups were collected from the same country and geographical region, indicating that mislabeling occurred before the germplasm were introduced into WCSRG.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Identified homonymous mislabeling groups in the <italic>Saccharum</italic> germplasm maintained in the WCSRG.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">Homonymous mislabeling group</th>
<th valign="top" align="left">Name</th>
<th valign="top" align="left">Code</th>
<th valign="top" align="left">Species</th>
<th valign="top" align="left">Origin</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">1</td>
<td valign="top" align="left">AGOULE</td>
<td valign="top" align="left">SAC0451</td>
<td valign="top" align="left">
<italic>S. sinense</italic>
</td>
<td valign="top" align="left">India Tamil Nadu</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="left">BA 11569</td>
<td valign="top" align="left">SAC0638</td>
<td valign="top" align="left">
<italic>S. officinarum</italic>
</td>
<td valign="top" align="left">Barbados</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="left">Chino</td>
<td valign="top" align="left">SAC0577</td>
<td valign="top" align="left">
<italic>S. officinarum</italic>
</td>
<td valign="top" align="left">Hawaii</td>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td valign="top" align="left">CO 312</td>
<td valign="top" align="left">SAC0636</td>
<td valign="top" align="left">Hybrid</td>
<td valign="top" align="left">South Africa</td>
</tr>
<tr>
<td valign="top" align="left">5</td>
<td valign="top" align="left">CO 313</td>
<td valign="top" align="left">SAC0635</td>
<td valign="top" align="left">Hybrid</td>
<td valign="top" align="left">South Africa</td>
</tr>
<tr>
<td valign="top" align="left">6</td>
<td valign="top" align="left">CP 01-1372</td>
<td valign="top" align="left">SAC0552</td>
<td valign="top" align="left">Unknown</td>
<td valign="top" align="left">Florida</td>
</tr>
<tr>
<td valign="top" align="left">7</td>
<td valign="top" align="left">CP 91-555</td>
<td valign="top" align="left">SAC0653</td>
<td valign="top" align="left">Unknown</td>
<td valign="top" align="left">Louisiana</td>
</tr>
<tr>
<td valign="top" align="left">8</td>
<td valign="top" align="left">F 154</td>
<td valign="top" align="left">SAC0605</td>
<td valign="top" align="left">Hybrid</td>
<td valign="top" align="left">Taiwan</td>
</tr>
<tr>
<td valign="top" align="left">9</td>
<td valign="top" align="left">F31-762</td>
<td valign="top" align="left">SAC0608</td>
<td valign="top" align="left">Unknown</td>
<td valign="top" align="left">Hawaii</td>
</tr>
<tr>
<td valign="top" align="left">10</td>
<td valign="top" align="left">F36-819</td>
<td valign="top" align="left">SAC0299</td>
<td valign="top" align="left">
<italic>S. officinarum</italic>
</td>
<td valign="top" align="left">Hawaii</td>
</tr>
<tr>
<td valign="top" align="left">11</td>
<td valign="top" align="left">HC 71</td>
<td valign="top" align="left">SAC0511</td>
<td valign="top" align="left">
<italic>S. officinarum</italic>
</td>
<td valign="top" align="left">Hawaii</td>
</tr>
<tr>
<td valign="top" align="left">12</td>
<td valign="top" align="left">IJ 76-414</td>
<td valign="top" align="left">SAC0460</td>
<td valign="top" align="left">
<italic>S. robustum</italic>
</td>
<td valign="top" align="left">Barbados</td>
</tr>
<tr>
<td valign="top" align="left">13</td>
<td valign="top" align="left">IJ 76-478</td>
<td valign="top" align="left">SAC0659</td>
<td valign="top" align="left">
<italic>S. officinarum</italic>
</td>
<td valign="top" align="left">Indonesia</td>
</tr>
<tr>
<td valign="top" align="left">14</td>
<td valign="top" align="left">IJ 76-480</td>
<td valign="top" align="left">SAC0602</td>
<td valign="top" align="left">
<italic>S. robustum</italic>
</td>
<td valign="top" align="left">Barbados</td>
</tr>
<tr>
<td valign="top" align="left">15</td>
<td valign="top" align="left">IJ 76-547</td>
<td valign="top" align="left">SAC0322</td>
<td valign="top" align="left">
<italic>S. robustum</italic>
</td>
<td valign="top" align="left">Guadeloupe</td>
</tr>
<tr>
<td valign="top" align="left">16</td>
<td valign="top" align="left">IN 81-014</td>
<td valign="top" align="left">SAC0328</td>
<td valign="top" align="left">
<italic>S. robustum</italic>
</td>
<td valign="top" align="left">Barbados</td>
</tr>
<tr>
<td valign="top" align="left">17</td>
<td valign="top" align="left">Kerah</td>
<td valign="top" align="left">SAC0515</td>
<td valign="top" align="left">
<italic>S. sinense</italic>
</td>
<td valign="top" align="left">Indonesia Java</td>
</tr>
<tr>
<td valign="top" align="left">18</td>
<td valign="top" align="left">Longchuan (Yunan)</td>
<td valign="top" align="left">SAC1228</td>
<td valign="top" align="left">
<italic>S. spontaneum</italic>
</td>
<td valign="top" align="left">China</td>
</tr>
<tr>
<td valign="top" align="left">19</td>
<td valign="top" align="left">MESANGEN</td>
<td valign="top" align="left">SAC0514</td>
<td valign="top" align="left">
<italic>S. barberi</italic>
</td>
<td valign="top" align="left">Guyana</td>
</tr>
<tr>
<td valign="top" align="left">20</td>
<td valign="top" align="left">MOL 6077</td>
<td valign="top" align="left">SAC0481</td>
<td valign="top" align="left">
<italic>S. robustum</italic>
</td>
<td valign="top" align="left">Hawaii</td>
</tr>
<tr>
<td valign="top" align="left">21</td>
<td valign="top" align="left">MOL 6427</td>
<td valign="top" align="left">SAC0569</td>
<td valign="top" align="left">Unknown</td>
<td valign="top" align="left">Hawaii</td>
</tr>
<tr>
<td valign="top" align="left">22</td>
<td valign="top" align="left">N 26-14</td>
<td valign="top" align="left">SAC0522</td>
<td valign="top" align="left">Unknown</td>
<td valign="top" align="left">Unknown</td>
</tr>
<tr>
<td valign="top" align="left">23</td>
<td valign="top" align="left">NG 57-208</td>
<td valign="top" align="left">SAC1234</td>
<td valign="top" align="left">
<italic>S. robustum</italic>
</td>
<td valign="top" align="left">Hawaii</td>
</tr>
<tr>
<td valign="top" align="left">24</td>
<td valign="top" align="left">NG 57-238</td>
<td valign="top" align="left">SAC0598</td>
<td valign="top" align="left">
<italic>S. robustum</italic>
</td>
<td valign="top" align="left">Barbados</td>
</tr>
<tr>
<td valign="top" align="left">25</td>
<td valign="top" align="left">NG 77-094</td>
<td valign="top" align="left">SAC0396</td>
<td valign="top" align="left">
<italic>S. robustum</italic>
</td>
<td valign="top" align="left">Papua New Guinea</td>
</tr>
<tr>
<td valign="top" align="left">26</td>
<td valign="top" align="left">SES 519</td>
<td valign="top" align="left">SAC218</td>
<td valign="top" align="left">
<italic>S. spontaneum</italic>
</td>
<td valign="top" align="left">India</td>
</tr>
<tr>
<td valign="top" align="left">27</td>
<td valign="top" align="left">Tanzhou</td>
<td valign="top" align="left">SAC0646</td>
<td valign="top" align="left">
<italic>S. sinense</italic>
</td>
<td valign="top" align="left">China Guangxi</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Each of the 27 accessions have at least one homonymous accession with different SNP genotype.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Population structure and genetic diversity</title>
<sec id="s3_3_1">
<label>3.3.1</label>
<title>Bayesian clustering analysis</title>
<p>The results of population structure analysis on 591 clones (with explicit passport records of species names) are presented in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>. According to the delta K method (<xref ref-type="bibr" rid="B10">Evanno et&#xa0;al., 2005</xref>), the most probable number of genetically distinct groups (K) was estimated to be two (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3A</bold>
</xref>). At K = 2, the <italic>S. spontaneum</italic> clones were clearly classified as a distinct cluster, while the other five species were assigned to the second cluster (shown in orange in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>). It&#x2019;s noticeable that majority of the <italic>S. sinense</italic> clones had full population membership of the second cluster (in orange), whereas the majority of the <italic>S. barberi</italic> clones showed admixed genotypes between the first cluster (in blue) and the second cluster (in orange).</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>
<bold>(A)</bold> Number of clusters based on the Evanno&#x2019;s Delta K value. <bold>(B)</bold> Population structure of the 591 <italic>Saccharum</italic> germplasm accessions with explicit passport record of species memberships partitioned using Structure v2.3.4. Black vertical lines indicate the separation of the <italic>Saccharum</italic> species. Multiple colors within the genetic group imply admixed individuals under the scenario of K=2.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1337736-g003.tif"/>
</fig>
<p>To further explore the substructure in the two clusters (<italic>S. spontaneum</italic> vs. the rest species), we repeated STRUCTURE analysis on each cluster using the same procedure and parameters. Through hierarchical analysis, the most probable number of genetically distinct groups (K) was two in the <italic>S. spontaneum</italic> cluster and four in the rest of the species (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4A, C</bold>
</xref>), based on Evanno&#x2019;s Delta K method. Therefore, the hierarchical partitioning classified the <italic>Saccharum</italic> germplasm into six sub-clusters: the <italic>S. spontaneum</italic> clones were classified into two populations, of which the first population was mainly originated from India and nearby countries in South Asia, whereas the second population were mainly originated from Southeast Asia and Barbados. Hereinafter, we used <italic>S. spontaneum</italic> (India) and <italic>S. spontaneum</italic> (SE Asia) to represent these two populations in subsequent analyses. The other four clusters correspond to four distinguishable species including 1) <italic>S. barberi</italic>, 2) <italic>S. officinarum</italic>, 3) <italic>S. robustum</italic>/<italic>S. edule</italic>, and 4) <italic>S. sinense</italic> (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4D</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Table S6</bold>
</xref>).</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>
<bold>(A)</bold> Number of clusters in the 273 <italic>S. spontaneum</italic> clones based on the Evanno&#x2019;s Delta K value. <bold>(B)</bold> Partitioned result of the 273 <italic>S. spontaneum</italic> clones at K = 2 using Structure v2.3.4. <bold>(C)</bold> Number of clusters in 299 clones of <italic>S. barberi, S. officinarum, S. robustum/S. edule</italic>, and <italic>S. sinense</italic> based on the Evanno&#x2019;s Delta K value. <bold>(D)</bold> Population structure of the 299 clones of <italic>S. barberi, S. officinarum, S. robustum/S. edule</italic>, and <italic>S. sinense</italic> obtained using Structure v2.3.4. Multiple colors within the genetic group imply admixed individuals.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1337736-g004.tif"/>
</fig>
<p>This result is highly compatible with the current taxonomy framework of <italic>Saccharum</italic> (<italic>sensu stricto</italic>), which proposes six <italic>Saccharum</italic> species, with <italic>S. edule</italic> considered as a mutant of <italic>S. robustum</italic> (<xref ref-type="bibr" rid="B5">Daniels and Roach, 1987</xref>). Based on this result, we also observed that many clones had mislabeled species membership. In total, we detected 141 cases of mistakes or inaccuracies in species membership. The largest group was found in <italic>S. officinarum</italic> (65), followed by <italic>S. robustum</italic> (32), <italic>S. sinense</italic> (16) and <italic>S. barberi</italic> (12). In contrast, only one clone of <italic>S. spontaneum</italic> was found to have mislabeled species membership (&#x201c;IN 84-072&#x201d; from Indonesia), in addition to 10 clones of hybrids derived from <italic>S. spontaneum</italic> (<xref ref-type="fig" rid="f4">
<bold>Figures&#xa0;4B, D</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Table S6</bold>
</xref>).</p>
<p>To further understand the genetic relationships among the five <italic>Saccharum</italic> species, we selected the core members of each species, based on the membership coefficient (Q-value) generated by the STRUCTURE analysis, with the threshold &#x2265; 0.80 (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S6</bold>
</xref>). This stringent cutoff enabled the inclusion of clones with minimal admixture. A total of 412 core members with unique genotypes were retained and each clone had a unique SNP genotype. These 412 core members were used in subsequent analysis of genetic diversity, including PCoA, Neighbor-Joining clustering analyses and AMOVA.</p>
</sec>
<sec id="s3_3_2">
<label>3.3.2</label>
<title>Principal Coordinates Analysis</title>
<p>The PCoA based on the Euclidean distance provided additional information on the relationships among the <italic>Saccharum</italic> germplasm clones (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>). The first three principal coordinates accounted for 42.7% of the total variation, with the first, second and third coordinates explaining 21.7%, 13.0%, and 8.0%, respectively. Consistent with the findings from the STRUCTURE analysis, the core members of the five species were clearly separated from each other in both <xref ref-type="fig" rid="f5">
<bold>Figures&#xa0;5A, B</bold>
</xref>.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>PCoA plots of the five <italic>Saccharum</italic> species represented by 412 core members with unique genotypes. <bold>(A)</bold> coordinates 1 vs 2 and <bold>(B)</bold> coordinates 2 vs 3. The analysis includes clones classified by STRUCTURE analysis with Q value &gt;0.80. Each point represents an individual clone. The first three main axes accounted for the following percentages of the total variation: first axis = 21.7%, second axis = 13.0% and third axis = 8.0%.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1337736-g005.tif"/>
</fig>
</sec>
<sec id="s3_3_3">
<label>3.3.3</label>
<title>Neighbor-Joining clustering analysis</title>
<p>The Neighbor-Joining tree (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>) revealed consistent results with STRUCTURE (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4C</bold>
</xref>) and PCoA analyses (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>). There were two main clusters in the core members of the five species. Cluster 1 consisted of <italic>S. officinarum</italic>, <italic>S. robustum</italic>, <italic>S. barberi</italic>, and <italic>S. sinense</italic>, while Cluster 2 included the two populations of <italic>S. spontaneum</italic> from India and Southeast Asia. Within Cluster 1, <italic>S. officinarum</italic> and <italic>S. robustum</italic> were grouped together, showing their close relationship (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>).</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Neighbor-Joining tree depicting the relationships among the five <italic>Saccharum</italic> species represented by 412 core members with unique genotypes. The species <italic>S. spontaneum</italic> included two populations from India and Southeast Asia.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1337736-g006.tif"/>
</fig>
</sec>
<sec id="s3_3_4">
<label>3.3.4</label>
<title>F statistics and Analysis of Molecular variance</title>
<p>The pattern of genetic differentiation between the five sugarcane species was also reflected by pairwise F<sub>ST</sub> values, where higher F<sub>ST</sub> values indicate greater genetic differentiation (<xref ref-type="bibr" rid="B48">Weir and Hill, 2002</xref>). The lowest pairwise F<sub>ST</sub> values (0.073) was found between the two <italic>S. spontaneum</italic> populations (India vs. Southeast Asia), indicating a low level of differentiation. Among the five species, the pairwise F<sub>ST</sub> ranged from 0.103 (<italic>S. officinarum vs S. barberi</italic>) to 0.323 (<italic>S. robustum</italic> vs <italic>S. sinense</italic>) (<xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>). The pairwise F<sub>ST</sub> values generally align with the results from the PCoA plot (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>) and the phylogenetic tree (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>). All F<sub>ST</sub> were highly significant (P &lt; 0.001) based on permutation test. However, it&#x2019;s noteworthy that <italic>S. sinense</italic> was found to have the highest mean F<sub>ST</sub> value (0.239), followed by <italic>S. robustum</italic> (0.224), <italic>S. barberi</italic> (0.178), <italic>S. spontaneum</italic> (0.176) and <italic>S. officinarum</italic> (0.123).</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Pairwise population F<sub>ST</sub> analysis among the five <italic>Saccharum</italic> species, represented by 412 core members with unique genotypes.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Species</th>
<th valign="middle" align="left">
<italic>S. barberi</italic>
</th>
<th valign="middle" align="left">
<italic>S. robustum</italic>
</th>
<th valign="middle" align="left">
<italic>S. officinarum</italic>
</th>
<th valign="middle" align="left">
<italic>S. sinense</italic>
</th>
<th valign="bottom" align="left">
<italic>S. spontaneum</italic> (SE Asia)</th>
<th valign="bottom" align="left">
<italic>S. spontaneum</italic> (India)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="bottom" align="left">
<italic>S. barberi</italic>
</td>
<td valign="bottom" align="left">0.000</td>
<td valign="bottom" align="left">0.248</td>
<td valign="bottom" align="left">0.103</td>
<td valign="bottom" align="left">0.204</td>
<td valign="bottom" align="left">0.161</td>
<td valign="bottom" align="left">0.176</td>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. robustum</italic>
</td>
<td valign="bottom" align="left">0.248</td>
<td valign="bottom" align="left">0.000</td>
<td valign="bottom" align="left">0.107</td>
<td valign="bottom" align="left">0.323</td>
<td valign="bottom" align="left">0.218</td>
<td valign="bottom" align="left">0.224</td>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. officinarum</italic>
</td>
<td valign="bottom" align="left">0.103</td>
<td valign="bottom" align="left">0.107</td>
<td valign="middle" align="left">0.000</td>
<td valign="middle" align="left">0.168</td>
<td valign="middle" align="left">0.119</td>
<td valign="middle" align="left">0.120</td>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. sinense</italic>
</td>
<td valign="bottom" align="left">0.204</td>
<td valign="bottom" align="left">0.323</td>
<td valign="middle" align="left">0.168</td>
<td valign="bottom" align="left">0.000</td>
<td valign="bottom" align="left">0.216</td>
<td valign="bottom" align="left">0.286</td>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. spontaneum</italic> (SE Asia)</td>
<td valign="bottom" align="left">0.161</td>
<td valign="bottom" align="left">0.218</td>
<td valign="middle" align="left">0.119</td>
<td valign="bottom" align="left">0.216</td>
<td valign="middle" align="left">0.000</td>
<td valign="middle" align="left">0.073</td>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. spontaneum</italic> (India)</td>
<td valign="bottom" align="left">0.176</td>
<td valign="bottom" align="left">0.224</td>
<td valign="middle" align="left">0.120</td>
<td valign="bottom" align="left">0.286</td>
<td valign="middle" align="left">0.073</td>
<td valign="middle" align="left">0.000</td>
</tr>
<tr>
<td valign="bottom" align="left"/>
<td valign="bottom" align="left">0.178</td>
<td valign="bottom" align="left">0.224</td>
<td valign="bottom" align="left">0.123</td>
<td valign="bottom" align="left">0.239</td>
<td valign="bottom" align="left">0.157</td>
<td valign="bottom" align="left">0.176</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>The probability, P (rand &gt;= data) based on 999 permutations is shown above the diagonal.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>AMOVA was employed to assess the distribution of the observed genetic variance among the five sugarcane species, excluding hybrids and unknown species. The results showed that a substantial proportion of the total genetic variation (85%) was attributed to within-species variation, while the remaining 15% of the total genetic variance was found in variation between species (<xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref>). This shows that the observed genetic variations primarily arise from variation among individual clones within species rather than between different species. Out of the five species, <italic>S. officinarum</italic> has the highest intra-specific molecular variance (46.1), indicating its status as a cultivated hybrid species with extensive gene introgressions. In contrast, <italic>S. robustum</italic> had the lowest intra-specific molecular variance (21.8), suggesting its status as an ancient species with limited inter-specific gene flow. Intra-specific molecular variance in <italic>S. spontaneum</italic>, <italic>S. barberi</italic> and <italic>S. sinense</italic> are comparable. It&#x2019;s noticeable that within <italic>S. spontaneum</italic>, the population from Southeast Asia had higher molecular variance (35.0) than the population from India (30.8).</p>
<table-wrap id="T4" position="float">
<label>Table&#xa0;4</label>
<caption>
<p>AMOVA and partitioning of total molecular variance within and among the five <italic>Saccharum</italic> species represented by 412 core members with unique genotypes.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="bottom" align="left">Source</th>
<th valign="bottom" align="left">df</th>
<th valign="bottom" align="left">SS</th>
<th valign="bottom" align="left">MS</th>
<th valign="bottom" align="left">Est. Var.</th>
<th valign="bottom" align="left">%</th>
<th valign="bottom" align="left">P value</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="bottom" align="left">Among Pops</td>
<td valign="bottom" align="left">5</td>
<td valign="bottom" align="left">4310.9</td>
<td valign="bottom" align="left">862.2</td>
<td valign="bottom" align="left">6.4</td>
<td valign="bottom" align="left">15%</td>
<td valign="bottom" align="left">&lt;0.001</td>
</tr>
<tr>
<td valign="bottom" align="left">Within Pops</td>
<td valign="bottom" align="left">818</td>
<td valign="bottom" align="left">28509.8</td>
<td valign="bottom" align="left">34.9</td>
<td valign="bottom" align="left">34.9</td>
<td valign="bottom" align="left">85%</td>
<td valign="bottom" align="left"/>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. barberi</italic>
</td>
<td valign="bottom" align="left">37</td>
<td valign="bottom" align="left">1257.5</td>
<td valign="bottom" align="left">34.0</td>
<td valign="bottom" align="left"/>
<td valign="bottom" align="left"/>
<td valign="bottom" align="left"/>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. robustum</italic>
</td>
<td valign="bottom" align="left">123</td>
<td valign="bottom" align="left">2682.6</td>
<td valign="bottom" align="left">21.8</td>
<td valign="bottom" align="left"/>
<td valign="bottom" align="left"/>
<td valign="bottom" align="left"/>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. officinarum</italic>
</td>
<td valign="bottom" align="left">207</td>
<td valign="bottom" align="left">9543.0</td>
<td valign="bottom" align="left">46.1</td>
<td valign="bottom" align="left"/>
<td valign="bottom" align="left"/>
<td valign="bottom" align="left"/>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. sinense</italic>
</td>
<td valign="bottom" align="left">55</td>
<td valign="bottom" align="left">2000.1</td>
<td valign="bottom" align="left">36.4</td>
<td valign="bottom" align="left"/>
<td valign="bottom" align="left"/>
<td valign="bottom" align="left"/>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. spontaneum</italic> (S.E. Asia)</td>
<td valign="bottom" align="left">197</td>
<td valign="bottom" align="left">6898.5</td>
<td valign="bottom" align="left">35.0</td>
<td valign="bottom" align="left"/>
<td valign="bottom" align="left"/>
<td valign="bottom" align="left"/>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. spontaneum</italic> (India)</td>
<td valign="bottom" align="left">199</td>
<td valign="bottom" align="left">6128.1</td>
<td valign="bottom" align="left">30.8</td>
<td valign="bottom" align="left"/>
<td valign="bottom" align="left"/>
<td valign="bottom" align="left"/>
</tr>
<tr>
<td valign="bottom" align="left">Total</td>
<td valign="bottom" align="left">823</td>
<td valign="bottom" align="left">32820.7</td>
<td valign="bottom" align="left"/>
<td valign="bottom" align="left">41.2</td>
<td valign="bottom" align="left">100%</td>
<td valign="bottom" align="left"/>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>*Probability, P (rand &gt;= data), for F<sub>ST</sub> is based on standard permutation across the full data set.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3_3_5">
<label>3.3.5</label>
<title>Observed heterozygosity and genetic diversity</title>
<p>
<italic>S. spontaneum</italic> and <italic>S. robustum</italic> are considered as wild sugarcane species (<xref ref-type="bibr" rid="B9">Dinesh Babu et&#xa0;al., 2022</xref>). It is interesting to find that these two species exhibited relatively lower gene diversity and higher homogeneity compared to other cultivated species (<xref ref-type="table" rid="T5">
<bold>Table&#xa0;5</bold>
</xref>). Notably, <xref ref-type="bibr" rid="B55">Zhang et&#xa0;al. (2018)</xref> also reported low gene diversity across 64 <italic>S. spontaneum</italic> accessions, based on genome sequencing data. They showed that the nucleotide diversity was much lower than that of other clonally propagated crops such as potato, cassava, grape, and citrus. Modern sugarcane cultivars have been extensively developed through interspecific crosses between <italic>S. spontaneum</italic> and <italic>S. officinarum</italic>. This disparity between wild and cultivated accessions suggests that the lower gene diversity observed in <italic>S. spontaneum</italic> is a characteristic of natural populations without human intervention. In contrast, the extensive intercrossing between species has likely contributed to the increased gene diversity and heterozygosity in hybrid cultivars.</p>
<table-wrap id="T5" position="float">
<label>Table&#xa0;5</label>
<caption>
<p>Sample size (N), Observed heterozygosity (H<sub>obs</sub>) and Gene diversity (H<sub>exp</sub>) in the five <italic>Saccharum</italic> species represented by 412 core members.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="bottom" align="left">Species</th>
<th valign="bottom" align="left">N</th>
<th valign="bottom" colspan="2" align="center">H<sub>obs</sub>
</th>
<th valign="bottom" colspan="2" align="center">H<sub>exp</sub>
</th>
</tr>
<tr>
<th valign="bottom" align="left"/>
<th valign="bottom" align="left"/>
<th valign="bottom" align="left">Mean</th>
<th valign="bottom" align="left">SE</th>
<th valign="bottom" align="left">Mean</th>
<th valign="bottom" align="left">SE</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="bottom" align="left">
<italic>S. barberi</italic>
</td>
<td valign="bottom" align="left">19</td>
<td valign="bottom" align="left">0.302</td>
<td valign="bottom" align="left">0.020</td>
<td valign="bottom" align="left">0.183</td>
<td valign="bottom" align="left">0.011</td>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. robustum</italic>
</td>
<td valign="bottom" align="left">62</td>
<td valign="bottom" align="left">0.162</td>
<td valign="bottom" align="left">0.014</td>
<td valign="bottom" align="left">0.114</td>
<td valign="bottom" align="left">0.009</td>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. officinarum</italic>
</td>
<td valign="bottom" align="left">104</td>
<td valign="bottom" align="left">0.354</td>
<td valign="bottom" align="left">0.014</td>
<td valign="bottom" align="left">0.256</td>
<td valign="bottom" align="left">0.008</td>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. sinense</italic>
</td>
<td valign="bottom" align="left">28</td>
<td valign="bottom" align="left">0.389</td>
<td valign="bottom" align="left">0.025</td>
<td valign="bottom" align="left">0.199</td>
<td valign="bottom" align="left">0.013</td>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. spontaneum (SEA)</italic>
</td>
<td valign="bottom" align="left">99</td>
<td valign="bottom" align="left">0.285</td>
<td valign="bottom" align="left">0.017</td>
<td valign="bottom" align="left">0.193</td>
<td valign="bottom" align="left">0.010</td>
</tr>
<tr>
<td valign="bottom" align="left">
<italic>S. spontaneum (India)</italic>
</td>
<td valign="bottom" align="left">100</td>
<td valign="bottom" align="left">0.238</td>
<td valign="bottom" align="left">0.015</td>
<td valign="bottom" align="left">0.169</td>
<td valign="bottom" align="left">0.009</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Inferred species membership and parentage for clones with missing passport information</title>
<p>Of the 901 <italic>Saccharum</italic> (<italic>sensu stricto</italic>) accessions maintained in this sugarcane germplasm collection, there were 175 clones that do not have clear passport data for their species membership. These clones were recorded as &#x2018;unknown&#x2019; in the collection. In addition, there were 123 clones recorded as &#x2018;Hybrid&#x2019;, but their parentage information was lacking. Using the selected core members of the five <italic>Saccharum</italic> species as references, we were able to assign the species membership and parentage for all the clones that have ambiguous passport records. Our result showed that most of these clones have a species membership of <italic>S. officinarum</italic> (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S8</bold>
</xref>). Among the 175 clones recorded as &#x2018;unknown&#x2019;, two were assigned to <italic>S. barberi</italic>, 12 to <italic>S. sinense</italic>, 12 to <italic>S. spontaneum</italic>, 10 to <italic>S. robustum</italic>, 91 to <italic>S. officinarum</italic>, and 40 to inter-specific hybrids. Similarly, among the 123 clones that were recorded as &#x2018;Hybrid&#x2019;, two were assigned to <italic>S. spontaneum</italic>, one to <italic>S. robustum</italic>, 96 to <italic>S. officinarum</italic>, and 24 to inter-specific hybrid (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S9</bold>
</xref>).</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>Genetic integrity is crucial for efficient conservation and use of plant germplasm for genetic improvement. This is particularly the case for many tropical/subtropical crops such as sugarcane, which is typically maintained in the field and propagated clonally, a process that can often result in mislabeling or loss of identifiers . Moreover, complex hybridization among sugarcane species further complicates the germplasm identification and highlights the need for comprehensive molecular and morphological characterization. However, accurate identification of sugarcane germplasm has been technically challenging, due to the high polyploidy (and aneuploidy) nature of this crop. In this study, we selected single-dose SNP markers and employed a targeted genotyping-by-sequencing (Seq-SNP) method to assess clone identity, population structure and genetic diversity in the <italic>Saccharum</italic> germplasm maintained in the WCSRG. This approach was chosen for its compatibility with sugarcane&#x2019;s diverse ploidy levels and large genome. The single-dose SNP markers offers advantages for polyploid plants such as sugarcane by enabling the identification and differentiation of alleles present across multiple sets of chromosomes without the need of ploidy determination (<xref ref-type="bibr" rid="B43">Sorrells, 1992</xref>; <xref ref-type="bibr" rid="B1">Aitken, 2022</xref>). By employing this high-throughput genotyping technique, we significantly improved our understanding of the genetic integrity and species relationship of sugarcane germplasm. The result provided valuable information to ensure the accuracy and efficiency in managing the sugarcane collection and facilitate its utilization in breeding programs.</p>
<sec id="s4_1">
<label>4.1</label>
<title>Clone mislabeling and genetic redundancy</title>
<p>Using the selected SNP markers, we genotyped 901 <italic>Saccharum</italic> clones from six species including hybrids. Based on the SNP genotypes, we discovered a high rate of clone mislabeling and genetic redundancy within the studied sugarcane collection. Because genotyping errors frequently occur, a pair of clones with a small number of mismatched loci could be duplicates as well (<xref ref-type="bibr" rid="B53">Zhang et&#xa0;al., 2006</xref>). Therefore, a threshold of mismatches to determine duplicates needs to be established. To evaluate the genotyping error rate, we included 12 samples propagated from the same clone as an internal control. Among the 12 samples, eight samples exhibited zero allele difference, while three samples showed one allele difference, and one sample showed two allele differences, suggesting that a two-allele difference could be used as the threshold for duplicate identification. Based on this threshold, we found that that half of the clones had at least one other clone with up to a two-allele difference (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S4</bold>
</xref>). We assessed how many SNP markers are needed to provide sufficient statistical power for sugarcane duplicate identification. Based on the cumulative PID-sib values for each species, we demonstrated that when utilizing 48 SNPs, the probability that two sibling individuals may share the same multilocus genotype by chance (<xref ref-type="bibr" rid="B45">Waits et&#xa0;al., 2001</xref>) was smaller than 0.001 (PIDsib &lt;0.001) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S8</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S1</bold>
</xref>). Therefore, the panel of 357 SNPs is far more than sufficient to identify synonymously mislabeled clones in each species (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S5</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Figure S1</bold>
</xref>).</p>
<p>In addition to the detection of synonymous groups, the single-dose SNP genotyping enabled the identification of 27 homonymous mislabeling groups (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>), where clones with the same name had different SNP genotypes. These homonymous mislabeling groups were detected in all five <italic>Saccharum</italic> species, often in germplasm accessions collected from the same geographical region. For example, the three clones of &#x201c;AGOULE&#x201d; were all collected from Tamil Nadu, India. However, they exhibited two different SNP genotypes. In another case, two clones were labeled as &#x201c;Chino&#x201d;, both from Hawaii, but their SNP genotypes were different. A more noteworthy example is the two &#x201c;Uba&#x201d; clones from India. Although they were both classified correctly as <italic>S. sinense</italic>, they had different SNP genotypes. Since &#x201c;Uba&#x201d; has been widely used as an important source of disease resistance in sugarcane breeding, the identified homonymous mislabeling has significant implications on sugarcane genetic studies and new variety development.</p>
<p>Furthermore, a high rate of mislabeling and inaccuracies was also detected in recorded species membership. Most of the mislabeling and inaccuracies occurred in species pairs that shared morphological similarities, such as <italic>S. officinarum</italic> vs <italic>S. robustum</italic> and <italic>S. barberi</italic> vs <italic>S. sinense</italic>. In contrast, there was almost no mislabeling of species membership between <italic>S. spontaneum</italic> and the rest of species. The high rate of mislabeling revealed in the present study was likely due to sugarcane&#x2019;s feature as a clonally propagated crop, which has allowed the exchange of sugarcane germplasm as clones among regions, countries, and continents. However, passport data, such as records and labels of the germplasm have not always followed the same naming conventions, leading to limited information about their correct identity. In fact, the majority of mislabeling and redundancy were observed in cultivated species, indicating a more intensive exchange of cultivated germplasm than wild species. Additional efforts of characterization are needed to fully resolve the mislabeling problem. SNP profiles for reference sugarcane clones need to be established through international collaboration. The putative mislabeled clones need to be compared with established references to correct the mislabeling errors. For the putative duplicate groups with near-identical genotypes, SNP genotyping will need to be repeated to confirm their clone identity. Moreover, since somaclonal mutation can occur in sugarcane, phenotypic examination remains essential to complement the result of molecular characterization.</p>
</sec>
<sec id="s4_2">
<label>4.2</label>
<title>Population structure and relationships among <italic>saccharum</italic> species</title>
<p>The sugarcane research community usually regarded <italic>Saccharum</italic> (<italic>sensu stricto</italic>) as containing six species, including two wild species (<italic>S. spontaneum</italic> and <italic>S. robustum</italic>), and four cultivated species - <italic>S. officinarum</italic>, <italic>S. edule</italic>, <italic>S. barberi</italic>, and <italic>S. sinense</italic> (<xref ref-type="bibr" rid="B39">Purseglove, 1972</xref>; <xref ref-type="bibr" rid="B5">Daniels and Roach, 1987</xref>; <xref ref-type="bibr" rid="B18">Grivet et&#xa0;al., 2006</xref>; <xref ref-type="bibr" rid="B20">Hemaprabha et&#xa0;al., 2022</xref>). The present study, using both model-based clustering and multivariant analysis based on 357 single dose SNP makers, supported the current classification of <italic>Saccharum</italic> germplasm. The only exception is <italic>S. edule</italic>, which could not be differentiated from <italic>S. robustum</italic>. <italic>S. edule</italic> is cultivated in New Guinea and nearby islands for its aborted edible inflorescences. Our result is consistent with the hypothesis that <italic>S. edule</italic> is a small group of sterile mutants that originated from <italic>S. robustum</italic> (<xref ref-type="bibr" rid="B39">Purseglove, 1972</xref>; <xref ref-type="bibr" rid="B17">Grivet et&#xa0;al., 2004</xref>; <xref ref-type="bibr" rid="B18">Grivet et&#xa0;al., 2006</xref>).</p>
<p>The present study also showed that <italic>S. spontaneum</italic> is a well-differentiated wild species, as shown by the analytical results of STRUCTURE (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>), PCoA (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>) and the NJ-tree (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>). This observation is consistent with previous reports based on SSR markers (<xref ref-type="bibr" rid="B4">Brown et&#xa0;al., 2007</xref>), genome re-sequencing data (<xref ref-type="bibr" rid="B51">Yang et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B13">Fickett et&#xa0;al., 2020</xref>), and plastid genome sequences (<xref ref-type="bibr" rid="B11">Evans and Joshi, 2016</xref>). In the present study, we found very few mislabeling between <italic>S. spontaneum</italic> and the other four species. Nonetheless, the result of the hierarchical STRUCTURE analysis on <italic>S. spontaneum</italic> showed that there were two sub-groups within this species (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A, B</bold>
</xref>). The first sub-group was mainly from India and south Asia, whereas the second sub-group was dominantly from Southeast Asia countries (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S6</bold>
</xref>). This result agrees with the recent report of <xref ref-type="bibr" rid="B37">Pompidor et&#xa0;al. (2021)</xref> and further indicates the importance of maintaining differentiated populations based on broader geographical regions.</p>
<p>A close genetic relationship was observed between <italic>S. robustum</italic> and <italic>S. officinarum</italic>. This observation is consistent with the recent finding of <xref ref-type="bibr" rid="B37">Pompidor et&#xa0;al. (2021)</xref>, which suggested that both <italic>S. officinarum</italic> and <italic>S. robustum</italic> were derived from the same two ancestral genomes (A and B genomes), indicating a common origin of both species. Nonetheless, our result showed that the two species could be clearly differentiated at the molecular level, as demonstrated by the results of STRUCTURE (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref>), PCoA (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>) and NJ tree (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>).</p>
<p>
<italic>S. barberi</italic> and <italic>S. sinense</italic> are two cultivated species that are closely related (<xref ref-type="bibr" rid="B39">Purseglove, 1972</xref>; <xref ref-type="bibr" rid="B29">Lu et&#xa0;al., 1994</xref>; <xref ref-type="bibr" rid="B20">Hemaprabha et&#xa0;al., 2022</xref>). However, the taxonomy status, as well as the relationship between these two species, has been a subject of debate. It was proposed that <italic>S. officinarum</italic> hybridized with <italic>S. spontaneum</italic> in Asia continental and the hybrid progenies developed into <italic>S. barberi</italic> in India and <italic>S. sinense</italic> in China (<xref ref-type="bibr" rid="B3">Brandes, 1956</xref>; <xref ref-type="bibr" rid="B5">Daniels and Roach, 1987</xref>; <xref ref-type="bibr" rid="B8">D&#x2019;Hont et&#xa0;al., 2002</xref>; <xref ref-type="bibr" rid="B28">Li et&#xa0;al., 2022</xref>). The geographical barrier (Southern China for <italic>C. sinensis</italic> vs. Northern India for <italic>C. barberi</italic>) could played significant role in the genetic differentiation of these two species. Using target enrichment sequencing of 307 germplasm accessions from WCSRG, <xref ref-type="bibr" rid="B51">Yang et&#xa0;al. (2019)</xref> showed that <italic>S. sinense</italic> and <italic>S. barberi</italic> were different in terms of genome compositions and potential ancestor accessions. Our result showed that <italic>S. barberi</italic> had the closest relationship with <italic>S. officinarum</italic>, which supported the proposal that <italic>S. barberi</italic> is a hybrid of <italic>S. officinarum</italic> and <italic>S. spontaneum</italic>. However, the present result also showed that relative to <italic>S. barberi</italic>, <italic>S. sinense</italic> had a larger genetic differentiation from <italic>S. officinarum</italic> and <italic>S. spontaneum</italic> (<xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>). Nonetheless, the number of samples of <italic>S. barberi</italic> and <italic>S. sinense</italic> used in the present study is relatively small. A systematic collection of samples representing the full geographical range of these two species is needed for a comprehensive analysis of population structure and genetic diversity in these two species.</p>
<p>To elucidate the underlying patterns of genetic variation in the sugarcane population, we conducted AMOVA to partition the observed variation among sugarcane clones. According to the AMOVA results, a significant proportion of the observed genetic diversity was attributed to variation among individual clones, accounting for 85% of the total variation, while the remaining 15% of the variation was attributed to variation between species (<xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref>). These results are consistent with previous studies (<xref ref-type="bibr" rid="B32">Nayak et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B30">Manechini et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B13">Fickett et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B41">Singh et&#xa0;al., 2020</xref>), indicating that the primary source of genetic diversity resides within species rather than between different species. The relatively low percentage of genetic variation between species suggests that there may be a considerable level of introgression and systematic crossing occurring between different sugarcane species, reflecting intercrossing nature among sugarcane species (<xref ref-type="bibr" rid="B31">Moore et&#xa0;al., 2013</xref>). In all species, the observed heterozygosity was higher than the expected heterozygosity, which suggests more intercrosses between isolated populations than the founders. The inter-specific gene flow in sugarcane is well-supported by historical accounts that, throughout the seventeenth, eighteenth, and nineteen centuries, there was an extensive exchange of varieties among the sugarcane planters worldwide (<xref ref-type="bibr" rid="B47">Warner, 1962</xref>). The development of improved cultivars involved frequent intercrossing between the species, which also likely contributed to the low genetic variation between species. This is supported by the observed heterozygosity exceeding Hardy-Weinberg expectations, suggesting a greater number of intercrosses than expected from the founders alone.</p>
<p>In conclusion, accurate germplasm identity is critical for efficient management of sugarcane germplasm. Using single-dose SNP markers, we genotyped all the <italic>Saccharum</italic> clones in WCSRG, maintained at USDA-ARS. The single-dose SNP genotypes enabled us to detect a high rate of mislabeling and genetic redundancy in this collection. In addition, an analysis of population structure using both ordination and model-based clustering, revealed five genetic groups in the <italic>Saccharum</italic> germplasm, corresponding to <italic>S. barberi, S. robustum, S. officinarum, S. sinense, and S. spontaneum</italic>. The pattern of genetic structure in the <italic>Saccharum</italic> gene pool suggested a high level of gene flow among sugarcane species and across different geographical regions, likely facilitated by human intervention, as evident from the lower genetic variation observed between species. This extensive germplasm exchange, predominantly as clonal material, may contribute to the mislabeling and redundancy observed within the sugarcane collections. Through comprehensive analyses of genetic identity, we were able to detect genetic redundancy in the collection. Furthermore, we assessed the ancestral species/populations among the <italic>Saccharum</italic> germplasm clones and ascertained the presence of core members in each species. Using these core members as references, we were able to correct mistakes and/or inaccuracy in species membership, as well as clarify the parentage for hybrid clones. The corrected mislabeling in species membership needs to be validated based on phenotypic characteristics. Our results ensured that the preserved clones in the WCSRG have distinct genetic makeup. This is the first time that a large germplasm collection of sugarcane&#x2014;a complicated polyploidy crop - was systematically characterized in terms of clone integrity and genetic redundancy. The single-dose SNP markers developed by this study offer a powerful tool for characterizing sugarcane germplasm worldwide. These markers can also be potentially used for identifying chromosomes. The reported findings have important implications for sugarcane genebank management, germplasm exchange, and crop genetic improvement.</p>
</sec>
</sec>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The genomic DNA sequencing data are accessible in the Sequence Read Archive (SRA) under bioproject ID PRJNA1051683 (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/bioproject">http://www.ncbi.nlm.nih.gov/bioproject</ext-link>).</p>
</sec>
<sec id="s6" sec-type="author-contributions">
<title>Author contributions</title>
<p>SP: Formal analysis, Investigation, Methodology, Software, Validation, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. DZ: Conceptualization, Formal analysis, Funding acquisition, Investigation, Methodology, Resources, Software, Supervision, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. GA: Conceptualization, Data curation, Investigation, Methodology, Project administration, Resources, Supervision, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing.</p>
</sec>
</body>
<back>
<sec id="s7" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article. This research was funded by appropriated funds from the United States Department of Agriculture, Agricultural Research Service (USDA-ARS) (Project Number: 6038-21000-024-00D and 8042-21000-303-000-D.</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>We are grateful to Dr. Aliya Momotaz and Dr. Md. Sariful Islam, United States Department of Agriculture, Agriculture Research Service, Sugarcane Field Station, Canal Point, Florida, for critically reading the manuscript. Help of Barbara Freeman, Douglas DeStefano and Brandon Rodriguez with collecting leaf samples is appreciated. Mention of a trade name, proprietary product, or vendor does not constitute an endorsement, guarantee, or warranty by the USDA and does not imply its approval to the exclusion of other products or vendors that may be suitable.</p>
</ack>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s9" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2023.1337736/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2023.1337736/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="Table_1.xlsx" id="ST1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Aitken</surname> <given-names>K. S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>History and development of molecular markers for sugarcane breeding</article-title>. <source>Sugar Tech</source> <volume>24</volume>, <fpage>341</fpage>&#x2013;<lpage>353</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12355-021-01000-7</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Akpertey</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Padi</surname> <given-names>F. K.</given-names>
</name>
<name>
<surname>Meinhardt</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Effectiveness of single nucleotide polymorphism markers in genotyping germplasm collections of coffea canephora using KASP assay</article-title>. <source>Front. Plant Sci.</source> <volume>11</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2020.612593</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brandes</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>1956</year>). <article-title>Origin, dispersal and use in breeding of the Melanesian garden sugarcane and their derivatives, Saccharum officinarum L</article-title>. <source>Proc. Int. Soc. Sugar Cane Technol.</source> <volume>9</volume>, <fpage>709</fpage>&#x2013;<lpage>750</lpage>.</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brown</surname> <given-names>J. S.</given-names>
</name>
<name>
<surname>Schnell</surname> <given-names>R. J.</given-names>
</name>
<name>
<surname>Power</surname> <given-names>E. J.</given-names>
</name>
<name>
<surname>Douglas</surname> <given-names>S. L.</given-names>
</name>
<name>
<surname>Kuhn</surname> <given-names>D. N.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Analysis of clonal germplasm from five Saccharum species: S. barberi, S. robustum, S. officinarum, S. sinense and S. spontaneum. A study of inter- and intra species relationships using microsatellite markers</article-title>. <source>Genet. Resour. Crop Evol.</source> <volume>54</volume>, <fpage>627</fpage>&#x2013;<lpage>648</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10722-006-0035-z</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Daniels</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Roach</surname> <given-names>B. T.</given-names>
</name>
</person-group> (<year>1987</year>). &#x201c;<article-title>Chapter 2 - taxonomy and evolution</article-title>,&#x201d; in <source>Developments in crop science sugarcane improvement through breeding</source>. Ed. <person-group person-group-type="editor">
<name>
<surname>Heinz</surname> <given-names>D. J.</given-names>
</name>
</person-group> (<publisher-loc>New York</publisher-loc>: <publisher-name>Elsevier</publisher-name>), <fpage>7</fpage>&#x2013;<lpage>84</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/B978-0-444-42769-4.50007-2</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Deren</surname> <given-names>C. W.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Genetic base of U.S. Mainland sugarcane</article-title>. <source>Crop Sci.</source> <volume>35</volume>, <elocation-id>cropsci1995.0011183X003500040047x</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.2135/cropsci1995.0011183X003500040047x</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>D&#x2019;Hont</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Grivet</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Feldmann</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Rao</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Berding</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Glaszmann</surname> <given-names>J. C.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>Characterisation of the double genome structure of modern sugarcane cultivars (Saccharum spp.) by molecular cytogenetics</article-title>. <source>Mol. Gen. Genet. MGG</source> <volume>250</volume>, <fpage>405</fpage>&#x2013;<lpage>413</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/BF02174028</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>D&#x2019;Hont</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Paulet</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Glaszmann</surname> <given-names>J. C.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Oligoclonal interspecific origin of &#x2018;North Indian&#x2019; and &#x2018;Chinese&#x2019; sugarcanes</article-title>. <source>Chromosome Res.</source> <volume>10</volume>, <fpage>253</fpage>&#x2013;<lpage>262</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1023/A:1015204424287</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dinesh Babu</surname> <given-names>K. S.</given-names>
</name>
<name>
<surname>Janakiraman</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Palaniswamy</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Kasirajan</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Gomathi</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Ramkumar</surname> <given-names>T. R.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A short review on sugarcane: its domestication, molecular manipulations and future perspectives</article-title>. <source>Genet. Resour. Crop Evol.</source> <volume>69</volume>, <fpage>2623</fpage>&#x2013;<lpage>2643</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10722-022-01430-6</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Evanno</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Regnaut</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Goudet</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Detecting the number of clusters of individuals using the software STRUCTURE: a simulation study</article-title>. <source>Mol. Ecol.</source> <volume>14</volume>, <fpage>2611</fpage>&#x2013;<lpage>2620</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1365-294X.2005.02553.x</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Evans</surname> <given-names>D. L.</given-names>
</name>
<name>
<surname>Joshi</surname> <given-names>S. V.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Complete chloroplast genomes of Saccharum spontaneum, Saccharum officinarum and Miscanthus floridulus (Panicoideae: Andropogoneae) reveal the plastid view on sugarcane origins</article-title>. <source>Syst. Biodivers.</source> <volume>14</volume>, <fpage>548</fpage>&#x2013;<lpage>571</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/14772000.2016.1197336</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="web">
<person-group person-group-type="author">
<collab>FAO</collab>
</person-group> (<year>2023</year>). <source>Food and Agricultural data</source>. Available at: <uri xlink:href="https://www.fao.org/faostat/en/#home">https://www.fao.org/faostat/en/#home</uri> (Accessed <access-date>July 13, 2023</access-date>).</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fickett</surname> <given-names>N. D.</given-names>
</name>
<name>
<surname>Ebrahimi</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Parco</surname> <given-names>A. P.</given-names>
</name>
<name>
<surname>Gutierrez</surname> <given-names>A. V.</given-names>
</name>
<name>
<surname>Hale</surname> <given-names>A. L.</given-names>
</name>
<name>
<surname>Pontif</surname> <given-names>M. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>An enriched sugarcane diversity panel for utilization in genetic improvement of sugarcane</article-title>. <source>Sci. Rep.</source> <volume>10</volume>, <fpage>13390</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-020-70292-8</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Formann</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Hahn</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Janke</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Stinner</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Str&#xe4;uber</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Logro&#xf1;o</surname> <given-names>W.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Beyond sugar and ethanol production: value generation opportunities through sugarcane residues</article-title>. <source>Front. Energy Res.</source> <volume>8</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fenrg.2020.579577</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Garrison</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Marth</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Haplotype-based variant detection from short-read sequencing</article-title>. <source>arXiv.org</source>.</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Granato</surname> <given-names>I. S. C.</given-names>
</name>
<name>
<surname>Galli</surname> <given-names>G.</given-names>
</name>
<name>
<surname>de Oliveira Couto</surname> <given-names>E. G.</given-names>
</name>
<name>
<surname>e Souza</surname> <given-names>M. B.</given-names>
</name>
<name>
<surname>Mendon&#xe7;a</surname> <given-names>L. F.</given-names>
</name>
<name>
<surname>Fritsche-Neto</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>snpReady: a tool to assist breeders in genomic analysis</article-title>. <source>Mol. Breed.</source> <volume>38</volume>, <fpage>102</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11032-018-0844-8</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grivet</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Daniels</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Glaszmann</surname> <given-names>J. C.</given-names>
</name>
<name>
<surname>D&#x2019;Hont</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>A review of recent molecular genetics evidence for sugarcane evolution and domestication</article-title>. <source>Ethnobot. Res. Appl.</source> <volume>2</volume>, <fpage>009</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.17348/era.2.0.9-17</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Grivet</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Glaszmann</surname> <given-names>J.-C.</given-names>
</name>
<name>
<surname>D&#x2019;Hont</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2006</year>). &#x201c;<article-title>3. Molecular evidence of sugarcane evolution and domestication</article-title>,&#x201d; in <source>3. Molecular evidence of sugarcane evolution and domestication</source> (<publisher-loc>New York</publisher-loc>: <publisher-name>Columbia University Press</publisher-name>), <fpage>49</fpage>&#x2013;<lpage>66</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.7312/motl13316-004</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hale</surname> <given-names>A. L.</given-names>
</name>
<name>
<surname>Todd</surname> <given-names>J. R.</given-names>
</name>
<name>
<surname>Gravois</surname> <given-names>K. A.</given-names>
</name>
<name>
<surname>Mollov</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Malapi-Wight</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Momotaz</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Sugarcane breeding programs in the USA</article-title>. <source>Sugar Tech</source> <volume>24</volume>, <fpage>97</fpage>&#x2013;<lpage>111</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12355-021-01018-x</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hemaprabha</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Pathy</surname> <given-names>T. L.</given-names>
</name>
<name>
<surname>Mohanraj</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Alarmelu</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Ram</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Population structure of coimbatore canes developed in a century of sugarcane breeding in India</article-title>. <source>Sugar Tech</source> <volume>24</volume>, <fpage>1449</fpage>&#x2013;<lpage>1460</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12355-021-01093-0</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hoang</surname> <given-names>N. V.</given-names>
</name>
<name>
<surname>Furtado</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Botha</surname> <given-names>F. C.</given-names>
</name>
<name>
<surname>Simmons</surname> <given-names>B. A.</given-names>
</name>
<name>
<surname>Henry</surname> <given-names>R. J.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Potential for genetic improvement of sugarcane as a source of biomass for biofuels</article-title>. <source>Front. Bioeng. Biotechnol.</source> <volume>3</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fbioe.2015.00182</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jo</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>G. W.</given-names>
</name>
<name>
<surname>Kwon</surname> <given-names>J.-K.</given-names>
</name>
<name>
<surname>Kang</surname> <given-names>B.-C.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Development of a panel of genotyping-in-thousands by sequencing in capsicum</article-title>. <source>Front. Plant Sci.</source> <volume>12</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2021.769473</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kalinowski</surname> <given-names>S. T.</given-names>
</name>
<name>
<surname>Wagner</surname> <given-names>A. P.</given-names>
</name>
<name>
<surname>Taper</surname> <given-names>M. L.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>ml-relate: a computer program for maximum likelihood estimation of relatedness and relationship</article-title>. <source>Mol. Ecol. Notes</source> <volume>6</volume>, <fpage>576</fpage>&#x2013;<lpage>579</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1471-8286.2006.01256.x</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kamvar</surname> <given-names>Z. N.</given-names>
</name>
<name>
<surname>Tabima</surname> <given-names>J. F.</given-names>
</name>
<name>
<surname>Gr&#xfc;nwald</surname> <given-names>N. J.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Poppr: an R package for genetic analysis of populations with clonal, partially clonal, and/or sexual reproduction</article-title>. <source>PeerJ</source> <volume>2</volume>, <elocation-id>e281</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.7717/peerj.281</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kopelman</surname> <given-names>N. M.</given-names>
</name>
<name>
<surname>Mayzel</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Jakobsson</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Rosenberg</surname> <given-names>N. A.</given-names>
</name>
<name>
<surname>Mayrose</surname> <given-names>I.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Clumpak: a program for identifying clustering modes and packaging population structure inferences across K</article-title>. <source>Mol. Ecol. Resour.</source> <volume>15</volume>, <fpage>1179</fpage>&#x2013;<lpage>1191</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/1755-0998.12387</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lam</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Shine</surname> <given-names>J.</given-names>
<suffix>Jr.</suffix>
</name>
<name>
<surname>Da Silva</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Lawton</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Bonos</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Calvino</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2009</year>). <article-title>Improving sugarcane for biofuel: engineering for an even better feedstock</article-title>. <source>GCB Bioenergy</source> <volume>1</volume>, <fpage>251</fpage>&#x2013;<lpage>255</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1757-1707.2009.01016.x</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Langmead</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Salzberg</surname> <given-names>S. L.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Fast gapped-read alignment with Bowtie 2</article-title>. <source>Nat. Methods</source> <volume>9</volume>, <fpage>357</fpage>&#x2013;<lpage>359</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nmeth.1923</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Duan</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Jing</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Kuang</surname> <given-names>B.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Comparative analysis of chloroplast genome in saccharum spp. and related members of &#x2018;Saccharum complex.&#x2019;</article-title>. <source>Int. J. Mol. Sci.</source> <volume>23</volume>, <elocation-id>7661</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/ijms23147661</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lu</surname> <given-names>Y. H.</given-names>
</name>
<name>
<surname>D&#x2019;Hont</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Walker</surname> <given-names>D. I. T.</given-names>
</name>
<name>
<surname>Rao</surname> <given-names>P. S.</given-names>
</name>
<name>
<surname>Feldmann</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Glaszmann</surname> <given-names>J. C.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>Relationships among ancestral species of sugarcane revealed with RFLP using single copy maize nuclear probes</article-title>. <source>Euphytica</source> <volume>78</volume>, <fpage>7</fpage>&#x2013;<lpage>18</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/BF00021393</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Manechini</surname> <given-names>J. R. V.</given-names>
</name>
<name>
<surname>Costa</surname> <given-names>J. B.</given-names>
</name>
<name>
<surname>Pereira</surname> <given-names>B. T.</given-names>
</name>
<name>
<surname>Carlini-Garcia</surname> <given-names>L. A.</given-names>
</name>
<name>
<surname>Xavier</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>de A.</surname> <given-names>M. G.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Unraveling the genetic structure of Brazilian commercial sugarcane cultivars through microsatellite markers</article-title>. <source>PloS One</source> <volume>13</volume>, <elocation-id>e0195623</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0195623</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Moore</surname> <given-names>P. H.</given-names>
</name>
<name>
<surname>Paterson</surname> <given-names>A. H.</given-names>
</name>
<name>
<surname>Tew</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2013</year>). &#x201c;<article-title>Sugarcane: the crop, the plant, and domestication</article-title>,&#x201d; in <source>Sugarcane: physiology, biochemistry, and functional biology</source> (<publisher-loc>Hoboken, NJ</publisher-loc>: <publisher-name>John Wiley &amp; Sons, Ltd</publisher-name>), <fpage>1</fpage>&#x2013;<lpage>17</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/9781118771280.ch1</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nayak</surname> <given-names>S. N.</given-names>
</name>
<name>
<surname>Song</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Villa</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Pathak</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Ayala-Silva</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2014</year>). <article-title>Promoting Utilization of Saccharum spp. Genetic Resources through Genetic Diversity Analysis and Core Collection Construction</article-title>. <source>PloS One</source> <volume>9</volume>, <elocation-id>e110856</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0110856</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Parco</surname> <given-names>A. S.</given-names>
</name>
<name>
<surname>Hale</surname> <given-names>A. L.</given-names>
</name>
<name>
<surname>Avellaneda</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Hoy</surname> <given-names>J. W.</given-names>
</name>
<name>
<surname>Kimbeng</surname> <given-names>C. A.</given-names>
</name>
<name>
<surname>Pontif</surname> <given-names>M. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Distribution and frequency of Bru1, a major brown rust resistance gene, in the sugarcane world collection</article-title>. <source>Plant Breed.</source> <volume>136</volume>, <fpage>637</fpage>&#x2013;<lpage>651</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/pbr.12508</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peakall</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Smouse</surname> <given-names>P. E.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>genalex 6: genetic analysis in Excel. Population genetic software for teaching and research</article-title>. <source>Mol. Ecol. Notes</source> <volume>6</volume>, <fpage>288</fpage>&#x2013;<lpage>295</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1471-8286.2005.01155.x</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peakall</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Smouse</surname> <given-names>P. E.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>GenAlEx 6.5: genetic analysis in Excel. Population genetic software for teaching and research&#x2014;an update</article-title>. <source>Bioinformatics</source> <volume>28</volume>, <fpage>2537</fpage>&#x2013;<lpage>2539</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bts460</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Piperidis</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Piperidis</surname> <given-names>N.</given-names>
</name>
<name>
<surname>D&#x2019;Hont</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Molecular cytogenetic investigation of chromosome composition and transmission in sugarcane</article-title>. <source>Mol. Genet. Genomics</source> <volume>284</volume>, <fpage>65</fpage>&#x2013;<lpage>73</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00438-010-0546-3</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pompidor</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Charron</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Hervouet</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Bocs</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Droc</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Rivallan</surname> <given-names>R.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Three founding ancestral genomes involved in the origin of sugarcane</article-title>. <source>Ann. Bot.</source> <volume>127</volume>, <fpage>827</fpage>&#x2013;<lpage>840</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/aob/mcab008</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pritchard</surname> <given-names>J. K.</given-names>
</name>
<name>
<surname>Stephens</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Donnelly</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Inference of population structure using multilocus genotype data</article-title>. <source>Genetics</source> <volume>155</volume>, <fpage>945</fpage>&#x2013;<lpage>959</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/genetics/155.2.945</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Purseglove</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>1972</year>). <source>Tropical crops: monocotyledons</source> (<publisher-loc>London</publisher-loc>: <publisher-name>Longman Group</publisher-name>).</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Raboin</surname> <given-names>L.-M.</given-names>
</name>
<name>
<surname>Oliveira</surname> <given-names>K. M.</given-names>
</name>
<name>
<surname>Lecunff</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Telismart</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Roques</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Butterfield</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2006</year>). <article-title>Genetic mapping in sugarcane, a high polyploid, using bi-parental progeny: identification of a gene controlling stalk colour and a new rust resistance gene</article-title>. <source>TAG Theor. Appl. Genet. Theor. Angew. Genet.</source> <volume>112</volume>, <fpage>1382</fpage>&#x2013;<lpage>1391</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00122-006-0240-3</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Singh</surname> <given-names>R. B.</given-names>
</name>
<name>
<surname>Mahenderakar</surname> <given-names>M. D.</given-names>
</name>
<name>
<surname>Jugran</surname> <given-names>A. K.</given-names>
</name>
<name>
<surname>Singh</surname> <given-names>R. K.</given-names>
</name>
<name>
<surname>Srivastava</surname> <given-names>R. K.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Assessing genetic diversity and population structure of sugarcane cultivars, progenitor species and genera using microsatellite (SSR) markers</article-title>. <source>Gene</source> <volume>753</volume>, <elocation-id>144800</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.gene.2020.144800</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Song</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Resende</surname> <given-names>M. F. R.</given-names>
<suffix>Jr.</suffix>
</name>
<name>
<surname>Neves</surname> <given-names>L. G.</given-names>
</name>
<name>
<surname>Todd</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>Natural allelic variations in highly polyploidy saccharum complex</article-title>. <source>Front. Plant Sci.</source> <volume>7</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2016.00804</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sorrells</surname> <given-names>M. E.</given-names>
</name>
</person-group> (<year>1992</year>). <article-title>Development and application of RFLPs in polyploids</article-title>. <source>Crop Sci.</source> <volume>32</volume>, <elocation-id>cropsci1992.0011183X003200050003x</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.2135/cropsci1992.0011183X003200050003x</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Spangler</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Zaitchik</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Russo</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Kellogg</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>Andropogoneae evolution and generic limits in sorghum (Poaceae) using ndhF sequences</article-title>. <source>Syst. Bot.</source> <volume>24</volume>, <fpage>267</fpage>&#x2013;<lpage>281</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2307/2419552</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Waits</surname> <given-names>L. P.</given-names>
</name>
<name>
<surname>Luikart</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Taberlet</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Estimating the probability of identity among genotypes in natural populations: cautions and guidelines</article-title>. <source>Mol. Ecol.</source> <volume>10</volume>, <fpage>249</fpage>&#x2013;<lpage>256</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1046/j.1365-294x.2001.01185.x</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Fang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Advances in sugarcane genomics and genetics</article-title>. <source>Sugar Tech</source> <volume>24</volume>, <fpage>354</fpage>&#x2013;<lpage>368</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12355-021-01065-4</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Warner</surname> <given-names>J. N.</given-names>
</name>
</person-group> (<year>1962</year>). <article-title>Sugar cane: an indigenous papuan cultigen</article-title>. <source>Ethnology</source> <volume>1</volume>, <fpage>405</fpage>&#x2013;<lpage>411</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2307/3772848</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Weir</surname> <given-names>B. S.</given-names>
</name>
<name>
<surname>Hill</surname> <given-names>W. G.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Estimating F-statistics</article-title>. <source>Annu. Rev. Genet.</source> <volume>36</volume>, <fpage>721</fpage>&#x2013;<lpage>750</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev.genet.36.050802.093940</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiong</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>S.-J.</given-names>
</name>
<name>
<surname>Pan</surname> <given-names>Y.-B.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Population Structure and Genetic Diversity Analysis in Sugarcane (Saccharum spp. hybrids) and Six Related Saccharum Species</article-title>. <source>Agronomy</source> <volume>12</volume>, <elocation-id>412</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/agronomy12020412</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Todd</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Sood</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Genome-wide association study of multiple yield traits in a diversity panel of polyploid sugarcane (Saccharum spp.)</article-title>. <source>Plant Genome</source> <volume>13</volume>, <elocation-id>e20006</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/tpg2.20006</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Song</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Todd</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Paudel</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>Z.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Target enrichment sequencing of 307 germplasm accessions identified ancestry of ancient and modern hybrids and signatures of adaptation and selection in sugarcane (Saccharum spp.), a &#x2018;sweet&#x2019; crop with &#x2018;bitter&#x2019; genomes</article-title>. <source>Plant Biotechnol. J.</source> <volume>17</volume>, <fpage>488</fpage>&#x2013;<lpage>498</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/pbi.12992</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>You</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Islam</surname>
</name>
<name>
<surname>Md.</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Sood</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Development of an Axiom Sugarcane100K SNP array for genetic map construction and QTL identification</article-title>. <source>Theor. Appl. Genet.</source> <volume>132</volume>, <fpage>2829</fpage>&#x2013;<lpage>2845</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00122-019-03391-4</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Mischke</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Goenaga</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Hemeida</surname> <given-names>A. A.</given-names>
</name>
<name>
<surname>Saunders</surname> <given-names>J. A.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Accuracy and reliability of high-throughput microsatellite genotyping for cacao clone identification</article-title>. <source>Crop Sci.</source> <volume>46</volume>, <fpage>2084</fpage>&#x2013;<lpage>2092</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2135/cropsci2006.01.0004</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Vega</surname> <given-names>F. E.</given-names>
</name>
<name>
<surname>Infante</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Solano</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Johnson</surname> <given-names>E. S.</given-names>
</name>
<name>
<surname>Meinhardt</surname> <given-names>L. W.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Accurate differentiation of green beans of arabica and robusta coffee using nanofluidic array of single nucleotide polymorphism (SNP) markers</article-title>. <source>J. AOAC Int.</source> <volume>103</volume>, <fpage>315</fpage>&#x2013;<lpage>324</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/jaocint/qsz002</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Hua</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Ma</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Allele-defined genome of the autopolyploid sugarcane Saccharum spontaneum L</article-title>. <source>Nat. Genet.</source> <volume>50</volume>, <fpage>1565</fpage>&#x2013;<lpage>1573</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41588-018-0237-2</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ziarsolo</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Hasing</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Hilario</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Garcia-Carpintero</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Blanca</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Bombarely</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>K-seq, an affordable, reliable, and open Klenow NGS-based genotyping technology</article-title>. <source>Plant Methods</source> <volume>17</volume>, <elocation-id>30</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13007-021-00733-6</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>