<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2023.1070600</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Evolutionary and phylogenetic analyses of 11 <italic>Cerasus</italic> species based on the complete chloroplast genome</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Wan</surname>
<given-names>Tian</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2221125"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Qiao</surname>
<given-names>Bai-xue</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhou</surname>
<given-names>Jing</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Shao</surname>
<given-names>Ke-sen</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Pan</surname>
<given-names>Liu-yi</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2197761"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>An</surname>
<given-names>Feng</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>He</surname>
<given-names>Xu-sheng</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Tao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Ping-ke</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Cai</surname>
<given-names>Yu-liang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2041960"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>College of Horticulture, Northwest Agriculture &amp; Forestry University</institution>, <addr-line>Yangling</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>College of Natural Resources and Environment, Northwest Agriculture &amp; Forestry University</institution>, <addr-line>Yangling</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Center of Experimental Station, Northwest Agriculture &amp; Forestry University</institution>, <addr-line>Yangling</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Peter Poczai, University of Helsinki, Finland</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Emre Sevindik, Adnan Menderes University, T&#xfc;rkiye; Woojong Jang, Herbal Medicine Research Department, Korea Institute of Oriental Medicine (KIOM), Republic of Korea</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Yu-liang Cai, <email xlink:href="mailto:yuanyicyl@nwafu.edu.cn">yuanyicyl@nwafu.edu.cn</email>
</p>
</fn>
<fn fn-type="other" id="fn002">
<p>This article was submitted to Plant Systematics and Evolution, a section of the journal Frontiers in Plant Science</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>03</day>
<month>03</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>14</volume>
<elocation-id>1070600</elocation-id>
<history>
<date date-type="received">
<day>15</day>
<month>10</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>21</day>
<month>02</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Wan, Qiao, Zhou, Shao, Pan, An, He, Liu, Li and Cai</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Wan, Qiao, Zhou, Shao, Pan, An, He, Liu, Li and Cai</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>The subgenus <italic>Cerasus</italic>, one of the most important groups in the genus <italic>Prunus sensu lato</italic>, comprises over 100 species; however, the taxonomic classification and phylogenetic relationships of <italic>Cerasus</italic> remain controversial. Therefore, it is necessary to reconstruct the phylogenetic tree for known <italic>Cerasus</italic> species. Here, we report the chloroplast (cp) genome sequences of 11 <italic>Cerasus</italic> species to provide insight into evolution of the plastome. The cp genomes of the 11 <italic>Cerasus</italic> species (157,571&#x2013;158,830 bp) displayed a typical quadripartite circular structure. The plastomes contain 115 unique genes, including 80 protein-coding genes, four ribosomal RNAs, and 31 transfer RNAs. Twenty genes were found to be duplicated in inverted repeats as well as at the boundary. The conserved non-coding sequences showed significant divergence compared with the coding regions. We found 12 genes and 14 intergenic regions with higher nucleotide diversity and more polymorphic sites, including <italic>matK</italic>, <italic>rps16</italic>, <italic>rbcL</italic>, <italic>rps16</italic>-<italic>trnQ</italic>, <italic>petN</italic>-<italic>psbM</italic>, and <italic>trnL</italic>-<italic>trnF</italic>. During cp plastome evolution, the codon profile has been strongly biased toward the use of A/T at the third base, and leucine and isoleucine codons appear the most frequently. We identified strong purifying selection on the <italic>rpoA</italic>, <italic>cemA</italic>, <italic>atpA</italic>, and <italic>petB</italic> genes; whereas <italic>ccsA</italic>, <italic>rps19</italic>, <italic>matK</italic>, <italic>rpoC2</italic>, <italic>ycf2</italic> and <italic>ndhI</italic> showed a signature of possible positive selection during the course of <italic>Cerasus</italic> evolution. In addition, we further analyzed the phylogenetic relationships of these species with 57 other congenic related species.Through reconstructing the <italic>Cerasus</italic> phylogeny tree, we found that true cherry is similar to the flora of China forming a distinct group, from which <italic>P. mahaleb</italic> was separated as an independent subclade. <italic>Microcerasus</italic> was genetically closer to <italic>Amygdalus</italic>, <italic>Armeniaca</italic>, and <italic>Prunus</italic> (<italic>sensu stricto</italic>) than to members of true cherry, whereas <italic>P. japonica</italic> and <italic>P. tomentosa</italic> were most closely related to <italic>P. triloba</italic> and <italic>P. pedunculata</italic>. However, <italic>P. tianshanica</italic> formed a clade with <italic>P. cerasus</italic>, <italic>P. fruticosa</italic>, <italic>P. cerasus</italic> &#xd7; <italic>P. canescens</italic> &#x2018;Gisela 6&#x2019;, and <italic>P. avium</italic> as a true cherry group. These results provide new insights into the plastome evolution of <italic>Cerasus</italic>, along with potential molecular markers and candidate DNA barcodes for further phylogenetic and phylogeographic analyses of <italic>Cerasus</italic> species.</p>
</abstract>
<kwd-group>
<kwd>
<italic>Prunus</italic>
</kwd>
<kwd>plastome</kwd>
<kwd>genomic variation</kwd>
<kwd>repeat sequence</kwd>
<kwd>protein-coding gene</kwd>
<kwd>phylogeny</kwd>
</kwd-group>
<counts>
<fig-count count="6"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="65"/>
<page-count count="13"/>
<word-count count="7510"/>
</counts>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Rosaceae is a large family that includes most economically important fruits species in temperate zones, such as <italic>Prunus</italic>, <italic>Armeniaca</italic>, <italic>Amygdalus</italic>, <italic>Pyrus</italic>, <italic>Malus</italic> and <italic>Crataegus</italic> species (<xref ref-type="bibr" rid="B62">Zarei et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B46">Sevindik et&#xa0;al., 2020</xref>). And the plant subgenus <italic>Cerasus</italic> is considered one of the most important groups in the genus <italic>Prunus (P.) sensu lato</italic>, comprising over 100 species, which are naturally distributed in temperate Asia, Europe, North America, China, Japan, and Korea (<xref ref-type="bibr" rid="B10">Chin et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>). In China, there are roughly 45 species of <italic>Cerasus</italic>, 35 of which are considered to be endemic according to the Flora of China project (<xref ref-type="bibr" rid="B61">Y&#xfc; et&#xa0;al., 1986</xref>). However, the taxonomic classification and phylogenetic relationships among species in the subgenus <italic>Cerasus</italic> or genus <italic>Prunus sensu lato</italic> have been controversial, with no unification reached to date (<xref ref-type="bibr" rid="B43">Potter et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B10">Chin et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B32">Liang et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>). For example, <italic>P. tomentosa</italic>, <italic>P. tianshanica</italic>, <italic>P. japonica</italic>, <italic>P. humilis</italic>, <italic>P. dictyoneura</italic>, <italic>P. glandulosa</italic>, <italic>P. pogonostyla</italic>, <italic>P. jacquemontii</italic>, <italic>P. prostrata</italic>, and <italic>P. pumila</italic> were classified in a single group, the &#x201c;dwarf cherry&#x201d; (<italic>Microcerasus</italic>), which was identified as a section of subgenus <italic>Cerasus</italic> according to <xref ref-type="bibr" rid="B61">Y&#xfc; et&#xa0;al. (1986)</xref> and <xref ref-type="bibr" rid="B56">Webster and Looney (1996)</xref>. However, in previous phylogenetic studies, <italic>Microcerasus</italic> species corresponded with <italic>Amygdalus</italic>, <italic>Armeniaca</italic>, or <italic>Prunus</italic> species (<xref ref-type="bibr" rid="B5">Bortiri et&#xa0;al., 2001</xref>; <xref ref-type="bibr" rid="B48">Shaw and Small, 2004</xref>; <xref ref-type="bibr" rid="B9">Chen et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>). Therefore, it is necessary to reconstruct the phylogenetic tree for <italic>Cerasus</italic> species.</p>
<p>The origin of the chloroplast (cp) can be traced back more than one billion years (<xref ref-type="bibr" rid="B52">Wang et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B44">Ravi et&#xa0;al., 2007</xref>). In land plants, the cp genome has a relatively conserved quadripartite structure, with conserved sequences in the range of 120&#x2013;218 kb (<xref ref-type="bibr" rid="B11">Daniell et&#xa0;al., 2016</xref>) encoding approximately 100&#x2013;130 genes (<xref ref-type="bibr" rid="B42">Palmer, 1985</xref>; <xref ref-type="bibr" rid="B44">Ravi et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B57">Wicke et&#xa0;al., 2011</xref>; <xref ref-type="bibr" rid="B11">Daniell et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B52">Wang et&#xa0;al., 2021</xref>). The cp structure comprises one large single-copy (LSC) region, one small single-copy (SSC) region, and two copies of an inverted repeat (IR) (<xref ref-type="bibr" rid="B49">Sugiura, 1992</xref>; <xref ref-type="bibr" rid="B44">Ravi et&#xa0;al., 2007</xref>). The significant developmental impact and limited coding potential of the cp genome, combined with maternal inheritance of this organelle provide tangible, causal approaches to understanding plant evolution, diversity, and phylogenic relationships (<xref ref-type="bibr" rid="B44">Ravi et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B38">Moore et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B17">Greiner et&#xa0;al., 2011</xref>). Recent studies have demonstrated that cp genome sequences offer remarkable resolution for analyzing phylogenetic relationships at various taxonomic levels, and can further provide evidence to explain effects of geography and climate oscillations on genetic divergence (<xref ref-type="bibr" rid="B24">Ivanova et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B59">Xue et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B58">Xue et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B13">Dunning et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B53">Wang et&#xa0;al., 2022</xref>). Although cp genome sequences of some <italic>Cerasus</italic> species have been published (<xref ref-type="bibr" rid="B9">Chen et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B14">Feng et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B31">Li et&#xa0;al., 2022</xref>), there is still a lack of information to enable comprehensive analysis of the interspecific relationships of the subgenus <italic>Cerasus</italic> and the relationship between <italic>Cerasus</italic> and <italic>Prunus sensu lato</italic>. Comparison of the cp genomes of the 11 <italic>Cerasus</italic> species can help to better understand evolution of the <italic>Cerasus</italic> genome and enable more profound analysis of the phylogenetic relationships in the genus <italic>Prunus</italic>, offering valuable insights.</p>
<p>In this study, we performed a comparative analysis of 11 complete <italic>Cerasus</italic> cp genomes to explore the features and structural differentiation of sequences among species. Furthermore, we reconstructed a phylogenetic tree using the newly obtained cp chloroplast sequences and published sequences to explore the genetic relationships among subgenus <italic>Cerasus</italic>, <italic>Prunus</italic> (<italic>sensu stricto</italic>), <italic>Amygdalus</italic>, and <italic>Armeniaca</italic>. Our study objectives were to: (1) gain insight into plastome structure features, (2) inform an improved understanding of cp genome evolution, and (3) further delineate the taxonomic status of <italic>Cerasus</italic>.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Plant materials, sequencing, cp genome assembly, and annotation</title>
<p>Fresh and healthy leaves were collected from adult plants of 11 <italic>Cerasus</italic> species (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). All samples were immediately frozen in liquid nitrogen and stored at &#x2212;80&#xb0;C until analysis. Total genomic DNA was extracted from 100 mg of fresh leaves using a modified CTAB method (<xref ref-type="bibr" rid="B40">Murray and Thompson, 1980</xref>). DNA libraries were prepared and sequenced on an Illumina NovaSeq 6000 platform (Illumina, San Diego, CA, USA) with paired-end 150-bp sequencing reads; only reads with a Q30 quality score greater than 80% were retained for analysis.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Sampling information for the <italic>Cerasus</italic> species.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">No.</th>
<th valign="middle" align="left">Species</th>
<th valign="middle" align="left">Origin</th>
<th valign="middle" align="left">Sampling sites, longitude, latitude</th>
<th valign="middle" align="left">GenBank number</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">1</td>
<td valign="top" align="left">
<italic>P. avium</italic> (wild)</td>
<td valign="top" align="left">Hungary</td>
<td valign="top" align="left">Mei County, Shaanxi, China<break/>E 107.9908&#xb0;, N 34.1123&#xb0;</td>
<td valign="top" align="left">OP598110</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="left">
<italic>P. cerasus</italic>
</td>
<td valign="top" align="left">Hungary</td>
<td valign="top" align="left">Mei County, Shaanxi, China<break/>E 107.9908&#xb0;, N 34.1123&#xb0;</td>
<td valign="top" align="left">MW477432</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="left">
<italic>P. cerasus &#xd7; P. canescens &#x2018;</italic>Gisela <italic>6&#x2019;</italic>
</td>
<td valign="top" align="left">Germany</td>
<td valign="top" align="left">Qishan County, Shaanxi, China<break/>E 107.6371&#xb0;, N 34.3749&#xb0;</td>
<td valign="top" align="left">MW477433</td>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td valign="top" align="left">
<italic>P. fruticosa</italic>
</td>
<td valign="top" align="left">Hungary</td>
<td valign="top" align="left">Mei County, Shaanxi, China<break/>E 107.9908&#xb0;, N 34.1123&#xb0;</td>
<td valign="top" align="left">MW477434</td>
</tr>
<tr>
<td valign="top" align="left">5</td>
<td valign="top" align="left">
<italic>P. japonica</italic>
</td>
<td valign="top" align="left">Shanxi, China</td>
<td valign="top" align="left">Hongdong, Shanxi, China<break/>E 111.8234&#xb0;, N 36.4298&#xb0;</td>
<td valign="top" align="left">OP598111</td>
</tr>
<tr>
<td valign="top" align="left">6</td>
<td valign="top" align="left">
<italic>P. mahaleb</italic>
</td>
<td valign="top" align="left">Hungary</td>
<td valign="top" align="left">Mei County, Shaanxi, China<break/>E 107.9908&#xb0;, N 34.1123&#xb0;</td>
<td valign="top" align="left">MW477435</td>
</tr>
<tr>
<td valign="top" align="left">7</td>
<td valign="top" align="left">
<italic>P. serrula</italic>
</td>
<td valign="top" align="left">Yunnan, China</td>
<td valign="top" align="left">Mei County, Shaanxi, China<break/>E 107.9908&#xb0;, N 34.1123&#xb0;</td>
<td valign="top" align="left">MW477436</td>
</tr>
<tr>
<td valign="top" align="left">8</td>
<td valign="top" align="left">
<italic>P. serrulata</italic>
</td>
<td valign="top" align="left">Shandong, China</td>
<td valign="top" align="left">RiZhao, Shandong, China<break/>E 119.2087&#xb0;, N 35.7501&#xb0;</td>
<td valign="top" align="left">OP611546</td>
</tr>
<tr>
<td valign="top" align="left">9</td>
<td valign="top" align="left">
<italic>P. tianshanica</italic>
</td>
<td valign="top" align="left">Xinjiang, China</td>
<td valign="top" align="left">Yili, Xinjiang, China<break/>E 81.2771&#xb0;, N 43.9094&#xb0;</td>
<td valign="top" align="left">OP598112</td>
</tr>
<tr>
<td valign="top" align="left">10</td>
<td valign="top" align="left">
<italic>P. tomentosa</italic>
</td>
<td valign="top" align="left">Shaanxi, China</td>
<td valign="top" align="left">Taibai, Shaanxi, China<break/>E 107.5947&#xb0;, N 34.0533&#xb0;</td>
<td valign="top" align="left">MW477437</td>
</tr>
<tr>
<td valign="top" align="left">11</td>
<td valign="top" align="left">
<italic>P. trichostoma</italic>
</td>
<td valign="top" align="left">Xizang, China</td>
<td valign="top" align="left">Nyingchi, Xizang, China<break/>E 94.6609&#xb0;, N 29.6340&#xb0;</td>
<td valign="top" align="left">OP598113</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The cp genome assembly of <italic>Cerasus</italic> species was obtained by a baiting and iterative mapping approach (<xref ref-type="bibr" rid="B18">Hahn et&#xa0;al., 2013</xref>). The complete cp genome of <italic>P. persica</italic> (HQ336405) was downloaded from the National Center for Biotechnology Information (NCBI) database as a reference genome. Geneious Prime v2022.0.2 (<ext-link ext-link-type="uri" xlink:href="https://www.geneious.com/">https://www.geneious.com/</ext-link>) (<xref ref-type="bibr" rid="B25">Kearse et&#xa0;al., 2012</xref>) was used for sequence correction. The 11 <italic>Cerasus</italic> species were annotated by Geneious Prime v2022.0.2, using <italic>P. pseudocerasus</italic> (NC030599) and <italic>P. persica</italic> (HQ336405) as reference sequences, and were annotated using GeSeq (<ext-link ext-link-type="uri" xlink:href="https://chlorobox.mpimp-golm.mpg.de/geseq.html">https://chlorobox.mpimp-golm.mpg.de/geseq.html</ext-link>) with no reference sequence. Manual editing of annotated and non-annotated portions, including exons and introns, was then performed. The transfer RNA (tRNA) sequences were confirmed using tRNAscan-SE 2.0 (<xref ref-type="bibr" rid="B7">Chan et&#xa0;al., 2021</xref>). All annotations were checked against the reference genomes (NC030599, NC054254, and MZ145044). Genome maps were drawn using OrganellarGenomeDRAW (OGDRAW) (<xref ref-type="bibr" rid="B16">Greiner et&#xa0;al., 2019</xref>).</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Complete cp genome comparison</title>
<p>Plastome structures among <italic>Cerasus</italic> species, apple, pear, and grape were compared by the mVISTA percent identity plot in Shuffle-LAGAN mode to reveal the major genomic variations located in LSC and SSC regions (<xref ref-type="bibr" rid="B6">Brudno et&#xa0;al., 2003</xref>; <xref ref-type="bibr" rid="B15">Frazer et&#xa0;al., 2004</xref>). Subsequently, nucleotide diversity (<italic>Pi</italic>) and polymorphic sites (<italic>S</italic>) of single-copy genes and intergenic regions (IGRs) were estimated for the 11 species and <italic>P. pseudocerasus</italic> (NC030599) by DnaSP v.6 (<xref ref-type="bibr" rid="B45">Rozas et&#xa0;al., 2017</xref>). The plastome genetic architecture of the 11 <italic>Cerasus</italic> species, 24 <italic>Cerasus</italic> species available in NCBI, and six other species for the LSC/IR and SSC/IR boundaries were analyzed by Irscope (<xref ref-type="bibr" rid="B2">Amiryousefi et&#xa0;al., 2018</xref>).</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Repeat sequences analysis</title>
<p>Simple sequence repeats (SSRs) were examined by the Perl script MicroSAtellite (MISA) (<xref ref-type="bibr" rid="B4">Beier et&#xa0;al., 2017</xref>) with the following parameter settings: motif size of 1&#x2013;6 nucleotides; and minimum repeat unit of 10 for mononucleotides, 6 for dinucleotides, and 5 for tri-, tetra-, penta-, and hexa-nucleotides. Non-overlapping repeat sequences were identified by REPuter (<xref ref-type="bibr" rid="B29">Kurtz et&#xa0;al., 2001</xref>) (repeat unit length minimum &#x2265; 25 bp, Hamming distance = 3). Four matches of repeats were classified, namely forward, reverse, complement, and palindromic matches. The online program Tandem Repeats Finder (<ext-link ext-link-type="uri" xlink:href="http://tandem.bu.edu/trf/trf.html">http://tandem.bu.edu/trf/trf.html</ext-link>) was used to find the tandem repeat sequences of at least 10 bp in length. The alignment parameters for match, mismatch, and indels were set to 2, 7, and 7, respectively.</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Codon usage bias and gene selective pressure analysis</title>
<p>For identification of codon usage patterns, all coding sequences (CDSs) greater than 350 nucleotides in length were extracted from the cp genome of <italic>Cerasus</italic>, as described previously (<xref ref-type="bibr" rid="B39">Morton, 1998</xref>). The filtered CDSs were subsequently used for the estimation of codon usage using CodonW v.9.1.2 and the codon usage patterns were analyzed by GraphPad Prism v.8.0. In addition to the overall codon usage, we further tabulated codon usage measures such as the effective number of codons (Nc) and GC frequency at the third synonymous position (GC3s). To investigate the selective pressure on plastome protein-coding genes between two species, non-synonymous (Ka) and synonymous (Ks) substitution values were calculated by KaKs_Calculator 2.0 (<xref ref-type="bibr" rid="B55">Wang et&#xa0;al., 2010</xref>), with the following settings: genetic code table = 11 (bacterial and plant plastid codes) and the Yang-Nielsen algorithm (YN) calculation method (<xref ref-type="bibr" rid="B24">Ivanova et&#xa0;al., 2017</xref>).</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Phylogenetic relationship</title>
<p>To reconstruct the phylogenetic relationships and verify the phylogenetic position of the subgenus <italic>Cerasus</italic> in <italic>Prunus sensu lato</italic>, 45 <italic>Cerasus</italic> cp genome sequences, including 34 published sequences downloaded from NCBI and the 11 sequences obtained in this study, were analyzed along with 23&#xa0;<italic>P.sensu lato</italic> complete cp genome sequences. <italic>Malus baccata</italic>, <italic>Malus micromalus</italic>, <italic>Pyrus communis</italic>, <italic>Pyrus ussuriensis</italic>, <italic>Vitis amurensis</italic>, <italic>V. amurensis</italic>, and <italic>Ziziphus jujuba</italic> were regarded as outgroups. Because the different regions of cp genome differed in the molecular evolutionary rates (<xref ref-type="bibr" rid="B64">Zhang et&#xa0;al., 2017</xref>), phylogenetic relationship analyses were performed using 6 datasets that are the complete cp genome sequences, LSC regions, SSC regions, two IR regions, common CDS and IGRs. Sequences were aligned by MAFFT using Geneious Prime v2022.0.2 (<xref ref-type="bibr" rid="B25">Kearse et&#xa0;al., 2012</xref>). The phylogenetic tree was constructed with the program Mrbayes (<xref ref-type="bibr" rid="B22">Huelsenbeck and Ronquist, 2001</xref>) of Geneious Prime and Maximum likelihood (ML) method of MEGA v11(<xref ref-type="bibr" rid="B28">Kumar et&#xa0;al., 2016</xref>), Mrbayes analysis used the following Markov chain Monte Carlo simulation settings: chain length = 1,100,000, subsampling frequency = 200, heated chains = 4, burn-in length = 100,000, heated chain temp = 0.2, and random seed = 170. ML analyses used the General Time Reversible +Gamma Distributed + Nearest-Neighbor-Interchange model with 1000 bootstrap replicates. The tree was visualized with Interactive Tree Of Life (iTOL) v5 software (<xref ref-type="bibr" rid="B30">Letunic and Bork, 2021</xref>) and manually edited where necessary.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Cp genome structure of <italic>Cerasus</italic> species</title>
<p>The <italic>Cerasus</italic> cp genome displays a typical quadripartite circular structure (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>) containing one LSC, one SSC, and two IR (IRB and IRA) regions, as determined by OGDRAW (<xref ref-type="bibr" rid="B16">Greiner et&#xa0;al., 2019</xref>). The plastome size of the 11 <italic>Cerasus</italic> species ranged from 157,571 bp (<italic>P. tomentosa</italic>) to 158,830 bp (<italic>P. tianshanica</italic>). The average coverage depth ranged from 421.8&#xd7; to 9410&#xd7; (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S1</bold>
</xref>; <xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S1</bold>
</xref>). The GC content of the <italic>Cerasus</italic> cp genome was very similar among the 11 species (36.5&#x2013;36.8%) with an average of 36.7% (<xref ref-type="supplementary-material" rid="SM1">
<bold>Table S1</bold>
</xref>).</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Chloroplast genome map of <italic>Cerasus</italic> species. Genes on the inside of the large circle are transcribed clockwise and those on the outside are transcribed counterclockwise. The genes are color-coded based on their functions. The dashed area represents the GC composition of the chloroplast genome. LSC, large single copy region; IR, inverted repeat; SSC, small single copy region.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1070600-g001.tif"/>
</fig>
<p>
<italic>Cerasus</italic> plastomes contained the same set of 115 unique genes, including 80 protein-coding genes, 4 ribosomal RNAs (rRNAs), and 31 tRNAs (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). Twenty genes are duplicated in IRs or at the boundaries, including nine protein-coding genes (<italic>rpl2</italic>, <italic>rpl23</italic>, <italic>rps7</italic>, <italic>rps12</italic>, <italic>rps19</italic>, <italic>ndhB</italic>, <italic>ycf1</italic>, <italic>ycf2</italic>, and <italic>ycf15</italic>), four rRNA genes (<italic>rrn4.5</italic>, <italic>rrn5</italic>, <italic>rrn16</italic>, and <italic>rrn23</italic>), and seven tRNA genes (<italic>trnA-UGC</italic>, <italic>trnI-CAU</italic>, <italic>trnI-GAU</italic>, <italic>trnL-CAA</italic>, <italic>trnN-GUU</italic>, <italic>trnR-ACG</italic>, and <italic>trnV-GAC</italic>). In the cp genome of <italic>P. tianshanica</italic>, an insertion sequence was identified that split <italic>ycf2</italic> in IRA into two segments (<xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S2A</bold>
</xref>). There are 18 different intron-containing genes (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>), including 10 protein-coding genes (<italic>atpF</italic>, <italic>ndhA</italic>, <italic>ndhB</italic>, <italic>rpl2</italic>, <italic>rpl16</italic>, <italic>rps12</italic>, <italic>rps16</italic>, <italic>rpoC1</italic>, <italic>petB</italic>, and <italic>petD</italic>) and six tRNA-coding genes (<italic>trnA-UGC</italic>, <italic>trnG-UCC</italic>, <italic>trnI-GAU</italic>, <italic>trnK-UUU</italic>, <italic>trnL-UAA</italic>, and <italic>trnV-UAC</italic>). Among these, <italic>trnK-UUU</italic> has the largest intron (2428&#x2013;2539 bp) with <italic>matK</italic> located within it. Two protein-coding genes (<italic>clpP</italic> and <italic>ycf3</italic>) contain two introns.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Gene types and functional classification of the <italic>Cerasus</italic> chloroplast genome.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="left">Category</th>
<th valign="middle" align="center">Gene group</th>
<th valign="middle" colspan="5" align="center">Gene symbol</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">Self-replication</td>
<td valign="middle" align="left">Ribosomal RNA genes</td>
<td valign="middle" align="left">
<italic>rrn4.5</italic>
<sup>a</sup>
</td>
<td valign="middle" align="left">
<italic>rrn5</italic>
<sup>a</sup>
</td>
<td valign="middle" align="left">
<italic>rrn16</italic>
<sup>a</sup>
</td>
<td valign="middle" align="left">
<italic>rrn23</italic>
<sup>a</sup>
</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Transfer RNA genes</td>
<td valign="middle" align="left">
<italic>trnA-UGC</italic>
<sup>a;b</sup>
</td>
<td valign="middle" align="left">
<italic>trnC-GCA</italic>
</td>
<td valign="middle" align="left">
<italic>trnD-GUC</italic>
</td>
<td valign="middle" align="left">
<italic>trnE-UUC</italic>
</td>
<td valign="middle" align="left">
<italic>trnF-GAA</italic>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>trnfM-CAU</italic>
</td>
<td valign="middle" align="left">
<italic>trnG-GCC</italic>
</td>
<td valign="middle" align="left">
<italic>trnG-UCC</italic>
<sup>b</sup>
</td>
<td valign="middle" align="left">
<italic>trnH-GUG</italic>
</td>
<td valign="middle" align="left">
<italic>trnI-CAU</italic>
<sup>a</sup>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>trnI-GAU</italic>
<sup>a;b</sup>
</td>
<td valign="middle" align="left">
<italic>trnK-UUU<sup>b</sup>
</italic>
</td>
<td valign="middle" align="left">
<italic>trnL-CAA</italic>
<sup>a;b</sup>
</td>
<td valign="middle" align="left">
<italic>trnL-UAA</italic>
<sup>b</sup>
</td>
<td valign="middle" align="left">
<italic>trnL-UAG</italic>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>trnM-CAU</italic>
</td>
<td valign="middle" align="left">
<italic>trnN-GUU<sup>a</sup>
</italic>
</td>
<td valign="middle" align="left">
<italic>trnP-UGG</italic>
</td>
<td valign="middle" align="left">
<italic>trnQ-UUG</italic>
</td>
<td valign="middle" align="left">
<italic>trnR-ACG</italic>
<sup>a</sup>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>trnR-UCU</italic>
</td>
<td valign="middle" align="left">
<italic>trnS-AGA</italic>
</td>
<td valign="middle" align="left">
<italic>trnS-GCU</italic>
</td>
<td valign="middle" align="left">
<italic>trnS-GGA</italic>
</td>
<td valign="middle" align="left">
<italic>trnS-UGA</italic>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>trnT-GGU</italic>
</td>
<td valign="middle" align="left">
<italic>trnT-UGU</italic>
</td>
<td valign="middle" align="left">
<italic>trnV-GAC<sup>a</sup>
</italic>
</td>
<td valign="middle" align="left">
<italic>trnV-UAC</italic>
<sup>b</sup>
</td>
<td valign="middle" align="left">
<italic>trnW-CCA</italic>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>trnY-GUA</italic>
</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Small subunit of ribosome</td>
<td valign="middle" align="left">
<italic>rps2</italic>
</td>
<td valign="middle" align="left">
<italic>rps3</italic>
</td>
<td valign="middle" align="left">
<italic>rps4</italic>
</td>
<td valign="middle" align="left">
<italic>rps7</italic>
<sup>a</sup>
</td>
<td valign="middle" align="left">
<italic>rps8</italic>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>rps11</italic>
</td>
<td valign="middle" align="left">
<italic>rps12</italic>
<sup>a;b</sup>
</td>
<td valign="middle" align="left">
<italic>rps14</italic>
</td>
<td valign="middle" align="left">
<italic>rps15</italic>
</td>
<td valign="middle" align="left">
<italic>rps16</italic>
<sup>b</sup>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>rps18</italic>
</td>
<td valign="middle" align="left">
<italic>rps19</italic>
<sup>d</sup>
</td>
<td valign="middle" align="left">
<italic>rps36</italic>
</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Large subunit of ribosome</td>
<td valign="middle" align="left">
<italic>rpl2</italic>
<sup>a;b</sup>
</td>
<td valign="middle" align="left">
<italic>rpl14</italic>
</td>
<td valign="middle" align="left">
<italic>rpl16</italic>
<sup>b</sup>
</td>
<td valign="middle" align="left">
<italic>rpl20</italic>
</td>
<td valign="middle" align="left">
<italic>rpl22</italic>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>rpl23</italic>
<sup>a</sup>
</td>
<td valign="middle" align="left">
<italic>rpl32</italic>
</td>
<td valign="middle" align="left">
<italic>rpl33</italic>
</td>
<td valign="middle" align="left">
<italic>rpl36</italic>
</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">DNA-dependent RNA polymerase</td>
<td valign="middle" align="left">
<italic>rpoA</italic>
</td>
<td valign="middle" align="left">
<italic>rpoB</italic>
</td>
<td valign="middle" align="left">
<italic>rpoC1</italic>
<sup>b</sup>
</td>
<td valign="middle" align="left">
<italic>rpoC2</italic>
</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">Photosynthesis</td>
<td valign="middle" align="left">Subunits of photosystem I</td>
<td valign="middle" align="left">
<italic>psaA</italic>
</td>
<td valign="middle" align="left">
<italic>psaB</italic>
</td>
<td valign="middle" align="left">
<italic>psaC</italic>
</td>
<td valign="middle" align="left">
<italic>psaI</italic>
</td>
<td valign="middle" align="left">
<italic>psaJ</italic>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Subunits of photosystem II</td>
<td valign="middle" align="left">
<italic>psbA</italic>
</td>
<td valign="middle" align="left">
<italic>psbB</italic>
</td>
<td valign="middle" align="left">
<italic>psbC</italic>
</td>
<td valign="middle" align="left">
<italic>psbD</italic>
</td>
<td valign="middle" align="left">
<italic>psbE</italic>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>psbF</italic>
</td>
<td valign="middle" align="left">
<italic>psbH</italic>
</td>
<td valign="middle" align="left">
<italic>psbI</italic>
</td>
<td valign="middle" align="left">
<italic>psbJ</italic>
</td>
<td valign="middle" align="left">
<italic>psbK</italic>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>psbL</italic>
</td>
<td valign="middle" align="left">
<italic>psbM</italic>
</td>
<td valign="middle" align="left">
<italic>psbN</italic>
</td>
<td valign="middle" align="left">
<italic>psbT</italic>
</td>
<td valign="middle" align="left">
<italic>psbZ</italic>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Subunits of cytochrome</td>
<td valign="middle" align="left">
<italic>petA</italic>
</td>
<td valign="middle" align="left">
<italic>petB<sup>b</sup>
</italic>
</td>
<td valign="middle" align="left">
<italic>petD<sup>b</sup>
</italic>
</td>
<td valign="middle" align="left">
<italic>petG</italic>
</td>
<td valign="middle" align="left">
<italic>petL</italic>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>petN</italic>
</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Subunits of ATP synthase</td>
<td valign="middle" align="left">
<italic>atpA</italic>
</td>
<td valign="middle" align="left">
<italic>atpB</italic>
</td>
<td valign="middle" align="left">
<italic>atpE</italic>
</td>
<td valign="middle" align="left">
<italic>atpF<sup>b</sup>
</italic>
</td>
<td valign="middle" align="left">
<italic>atpH</italic>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>atpI</italic>
</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Large subunit of RuBisCO</td>
<td valign="middle" align="left">
<italic>rbcL</italic>
</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Subunits of NADH dehydrogenase</td>
<td valign="middle" align="left">
<italic>ndhA</italic>
<sup>b</sup>
</td>
<td valign="middle" align="left">
<italic>ndhB</italic>
<sup>a;b</sup>
</td>
<td valign="middle" align="left">
<italic>ndhC</italic>
</td>
<td valign="middle" align="left">
<italic>ndhD</italic>
</td>
<td valign="middle" align="left">
<italic>ndhE</italic>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>ndhF</italic>
</td>
<td valign="middle" align="left">
<italic>ndhG</italic>
</td>
<td valign="middle" align="left">
<italic>ndhH</italic>
</td>
<td valign="middle" align="left">
<italic>ndhI</italic>
</td>
<td valign="middle" align="left">
<italic>ndhJ</italic>
</td>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left">
<italic>ndhK</italic>
</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left">Other genes</td>
<td valign="middle" align="left">Maturase</td>
<td valign="middle" align="left">
<italic>matK</italic>
</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Translational initiation factor</td>
<td valign="middle" align="left">
<italic>infA</italic>
</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Envelope membrane protein</td>
<td valign="middle" align="left">
<italic>cemA</italic>
</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Subunit of acetyl-CoA</td>
<td valign="middle" align="left">
<italic>accD</italic>
</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">C-type cytochrome synthesis gene</td>
<td valign="middle" align="left">
<italic>ccsA</italic>
</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Protease</td>
<td valign="middle" align="left">
<italic>clpP</italic>
<sup>c</sup>
</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="middle" align="left"/>
<td valign="middle" align="left">Proteins of unknown function</td>
<td valign="middle" align="left">
<italic>ycf1</italic>
<sup>a;d</sup>
</td>
<td valign="middle" align="left">
<italic>ycf2</italic>
<sup>a</sup>
</td>
<td valign="middle" align="left">
<italic>ycf4</italic>
</td>
<td valign="middle" align="left">
<italic>ycf3</italic>
<sup>c</sup>
</td>
<td valign="middle" align="left">
<italic>ycf15</italic>
<sup>a</sup>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>
<sup>a</sup>Two gene copies in inverted repeats; <sup>b</sup>gene containing a single intron; <sup>c</sup>gene containing two introns; <sup>d</sup>gene divided into two independent transcription units.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>In <italic>Cerasus</italic> plastomes, the protein-coding gene <italic>rps19</italic> is located on the boundary of the LSC and IR regions, except for <italic>P. avium</italic> in which only the <italic>rps19</italic> fragment is on IRA. Comparison showed significant differences of <italic>rps19</italic> gene sequences among the <italic>Cerasus</italic> species (<xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S2B</bold>
</xref>). The <italic>ycf1</italic> gene was located on the boundary of the SSC and IRA regions. <italic>ycf</italic> genes were identified as hypothetical cp reading frames, and small fragments of truncated <italic>ycf</italic> genes were detected in IRA (<italic>ycf15</italic>: 126 bp and 129 bp, respectively), with only partial <italic>ycf1</italic> identified in the IRB region. The remaining <italic>ycf</italic> genes were detected at the complete gene size. <italic>ycf2</italic> is a large functional gene encoding 2277 amino acids in cp IR regions. The <italic>ycf2</italic> gene in <italic>P. tianshanica</italic> was 6876 bp, with one inserted fragment of 42 bp located at the 900-bp position (<xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S2A</bold>
</xref>). In <italic>Cerasus</italic>, a high level of similarity was restricted to the IRs, and major differences originated from the LSC and SSC regions. The gene <italic>infA</italic>, which is a translation-related gene, was identified as a pseudogene.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Complete cp genome sequence comparison of 11 <italic>Cerasus</italic> species</title>
<p>The mVISTA (<xref ref-type="bibr" rid="B15">Frazer et&#xa0;al., 2004</xref>) analysis showed the overall sequence identity, divergent regions, and visualization of the aligned cp genome sequences in <italic>Cerasus</italic>. The LSC and SSC regions were clearly more divergent than the IRs (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>). The conserved non-coding sequences (CNSs) showed significantly more divergence than the coding regions (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref> and <xref ref-type="supplementary-material" rid="SM1">
<bold>Table S2</bold>
</xref>), indicating that the CDSs are much more conserved than the CNSs. Furthermore, the mean value of <italic>Pi</italic> in IRs (0.00157) was lower than that of the LSC (0.00719) or SSC (0.01041) regions, which demonstrated that the IR regions have fewer mutations and are thus more strongly conserved. Among 135 plastid genes, only 23 genes showed higher nucleotide diversity (<italic>Pi</italic> &gt; 0.003), with <italic>Pi</italic> values ranging from 0.00307 (<italic>rpoC2</italic>) to 0.00777 (<italic>rps15</italic>), and 12 genes (<italic>trnK-UUU</italic>, <italic>matK</italic>, <italic>rps16</italic>, <italic>trnG-UCC</italic>, <italic>rpoC2</italic>, <italic>rbcL</italic>, <italic>accD</italic>, <italic>clpP</italic>, <italic>rpl16</italic>, <italic>ndhF</italic>, <italic>ndhA</italic>, and <italic>ycf1</italic>) had a relatively higher number of polymorphic sites (<italic>S</italic> &gt; 10) (<xref ref-type="supplementary-material" rid="SM2">
<bold>Table S2A</bold>
</xref>; <xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S3</bold>
</xref>). However, 73 IGRs had <italic>Pi</italic> &gt; 0.003; the 10 most polymorphic IGRs in ascending order were <italic>rps19</italic>-<italic>trnG-GUU</italic> (<italic>Pi</italic> = 0.06926), <italic>trnR-UCU</italic>-<italic>atpA</italic>, <italic>ndhC</italic>-<italic>trnV-UAC</italic>, <italic>ccsA</italic>-<italic>ndhD</italic>, <italic>psbl</italic>-<italic>trnS-GCU</italic>, <italic>psbC</italic>-<italic>trnS-UGA</italic>, <italic>rpl32</italic>-<italic>trnS-AGA</italic>, <italic>rpl33</italic>-<italic>rps18</italic>, <italic>trnW-CCA</italic>-<italic>trnP-UGG</italic>, and <italic>psbZ</italic>-<italic>trnG-GCC</italic> (<italic>Pi</italic> = 0.01334). Moreover, there were 14 IGRs with <italic>Pi</italic> &gt; 0.01 and <italic>S</italic> &gt; 10 (<xref ref-type="supplementary-material" rid="SM2">
<bold>Table S2B</bold>
</xref>; <xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S3</bold>
</xref>). We further analyzed the sequence divergence patterns among all cp genomes. Finally, 506 single nucleotide polymorphisms (SNPs), 59 nucleotide substitution (NS) loci, and 1898 indel loci were identified through the nucleotide alignment (<xref ref-type="supplementary-material" rid="SM3">
<bold>Table S3</bold>
</xref>).</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Chloroplast genome sequence comparison of 11 <italic>Cerasus</italic> species, apple, pear, and grape based on mVISTA. The similarity graphical information portrays sequence identity with <italic>Prunus pseudocerasus</italic> (NC030599) as reference. A cut-off of 50% identity is used for the plots. In each plot, the Y-axis represents percent identity (50&#x2013;100%).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1070600-g002.tif"/>
</fig>
<p>Comparing the IR/LSC and IR/SSC boundaries of the 11 cp genomes of <italic>Cerasus</italic> species revealed the contraction and expansion of IRs with minimal variation at the boundaries. The boundary region of IRA/SSC appears to be relatively stable (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3</bold>
</xref>, <xref ref-type="supplementary-material" rid="SM1">
<bold>S3</bold>
</xref>). That is, the boundary gene <italic>ycf1</italic> showed high conservation among <italic>Cerasus</italic> species with a length of 5606 bp for the majority of the <italic>Cerasus</italic> species (7/11) analyzed. In <italic>P. serrulata</italic>, <italic>P. tomentosa</italic>, and <italic>P. japonica</italic>, <italic>ycf1</italic> had greater extension than found in the other species to different degrees (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>). Both the <italic>ycf1</italic> pseudogene and <italic>ndhF</italic> gene were at the IRB/SSC borders, which partially overlapped in the cp genomes of <italic>Cerasus</italic> species. The IRB/LSC junction was largely located in <italic>rps19</italic>, close to <italic>rpl22</italic> and <italic>rpl2</italic>, and except in <italic>P. avium</italic>, extension of the LSC resulted in larger contraction of IRB toward the <italic>rpl22</italic> direction. Concerning the IRA/LSC boundary, the junction site was the <italic>rps19</italic> gene in all <italic>Cerasus</italic> species, except for <italic>P. avium</italic> in which <italic>rps19</italic> showed a contraction in IRA regions, being 48 bp away from the boundary. In addition, <italic>trnH</italic> was consistently observed in all plastomes, which was located 5&#x2013;86 bp away from the border.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Comparison of the inverted repeat (IR)/large single copy (LSC) boundaries and IR/short single copy (SSC) boundaries among chloroplast genomes of 11 <italic>Cerasus</italic> species. JLA and JLB indicate the junction sites between the SSC and the two IRs (IRA and IRB); JSA and JSB denote the junction sites between the SSC and the two IRs.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1070600-g003.tif"/>
</fig>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Repeat sequence analysis</title>
<p>The types and distribution of SSRs were analyzed in the cp genomes of the 11 <italic>Cerasus</italic> species. A total of 634 SSRs were identified by MISA, 61.51% of which were distributed in the IGR and 133 of which were found in CDSs (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM4">
<bold>Table S4A</bold>
</xref>). Except for <italic>P. tianshanica</italic>, the SSRs were mainly enriched in the IGRs and CDSs, both accounting for 41.67% of all SSRs. For the other <italic>Cerasus</italic> species, SSRs were more abundant in IGRs than in other regions (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM4">
<bold>Table S4A</bold>
</xref>). Moreover, four types of SSRs were identified: mono-, di-, and tri-nucleotide, and complex repeats. Mononucleotide repeats were the most common, accounting for 85.65% of the total (n =543, range 45&#x2013;54; <xref ref-type="supplementary-material" rid="SM4">
<bold>Table S4A</bold>
</xref>). By contrast, only 31 dinucleotide repeats were identified (ranging from 1 to 5), accounting for 4.89% of the total, and only two trinucleotide repeats were found, in <italic>P. cerasus</italic> &#xd7; <italic>P. canescens</italic> &#x2018;Gisela 6&#x2019; and <italic>P. tianshanica</italic>, respectively. No other polynucleotides were detected. In addition, the composition of the mononucleotide repeats was mostly A/T, with C and G repeats accounting for less than 6% of these repeats (<xref ref-type="supplementary-material" rid="SM4">
<bold>Table S4A</bold>
</xref>), and all dinucleotide repeats were composed of AT/TA. For the non-overlapping repeats, there were 1164 forward repeats, 645 reverse repeats, 1160 palindromic repeats, 646 complement repeats, and 585 tandem repeats identified using REPuter (<xref ref-type="bibr" rid="B29">Kurtz et&#xa0;al., 2001</xref>) and Tandem Repeats Finder for the <italic>Cerasus</italic> plastomes (<xref ref-type="supplementary-material" rid="SM4">
<bold>Table S4B</bold>
</xref>). Forward repeats were the most abundant (n = 73&#x2013;179), followed by palindromic repeats (n = 25&#x2013;173). Tandem repeats were the least abundant repeat type, ranging from 45 in <italic>P. mahaleb</italic> to 73 in <italic>P. tianshanica</italic> within 5&#x2013;249 bp (<xref ref-type="supplementary-material" rid="SM4">
<bold>Table S4</bold>
</xref>). Dispersed repeats were more common in <italic>P. cerasus</italic> &#xd7; <italic>P. canescens</italic> &#x2018;Gisela 6&#x2019; and <italic>P. tianshanica</italic> than in the other species (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref> and <xref ref-type="supplementary-material" rid="SM4">
<bold>Table S4B</bold>
</xref>).</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Repetitive motif abundance in 11 <italic>Cerasus</italic> species computed by REPuter and Tandem Repeats Finder. <bold>(A)</bold> Distribution and types of simple sequence repeats in the eleven chloroplast genomes. <bold>(B)</bold> Number of repeat types in the eleven chloroplast genomes.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1070600-g004.tif"/>
</fig>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Codon usage bias and gene selective pressure analysis</title>
<p>A total of 49 <italic>Cerasus</italic> genes were selected based on the 350-bp length threshold for codon bias identification. Codon usage measures such as Nc; silent T, C, A, and G at the 3<sup>rd</sup> codon position (T3s, C3s, A3s and G3s, respectively); total number of amino acids (L_aa); aromaticity; and grand average of hydropathicity (GRAVY) were estimated (<xref ref-type="supplementary-material" rid="SM1">
<bold>Tables S4A</bold>
</xref>, <xref ref-type="supplementary-material" rid="SM1">
<bold>S5</bold>
</xref>). The number of synonymous codons (L_sym) was approximately 49.7 and the range of L_aa, except for the termination codon (TER), was from 24,034 in <italic>P. cerasus</italic> &#xd7; <italic>P. canescens</italic> &#x2018;Gisela 6&#x2019; to 24,421 in <italic>P. serrulata</italic>, with a relative synonymous codon usage (RSCU) value ranging from 0.38 (CUC) to 1.96 (UUA) (<xref ref-type="supplementary-material" rid="SM1">
<bold>Tables S5B, C</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Figures S5</bold>
</xref>, <xref ref-type="fig" rid="f5">
<bold>5</bold>
</xref>). The average Nc was 49.74 for CDSs of the 11 <italic>Cerasus</italic> species, and the T3s, C3s, A3s, and G3s was 0.4674, 0.1718, 0.4356, and 0.1817, respectively. The mean of GC3s was 0.269 and the GC content was 0.376 (<xref ref-type="supplementary-material" rid="SM5">
<bold>Table S5A</bold>
</xref>). In addition, leucine and isoleucine were the most common codons (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>). Methionine (AUG) and tryptophan (UGG) were each encoded by only one codon, and showed no codon bias (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>). Codon usage was biased toward A and T at the third codon position. Almost all A/U-ending codons had RSCU values larger than 1.0, except for Ile-AUA, Leu-CUA, and TER-UGA, whereas all C/G-ending codons had RSCU values &#x2264; 1, except for Leu-UUG (<xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S5</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM5">
<bold>Table S5C</bold>
</xref>).</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Codon content of 20 amino acids and termination codons in protein-coding genes of <italic>Cerasus</italic> plastomes. The left columns of the histogram present codon usage and the right columns denote the relative synonymous codon usage (RSCU) values. Colors correspond to codons listed underneath the columns.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1070600-g005.tif"/>
</fig>
<p>The synonymous (Ks) and non-synonymous (Ka) nucleotide substitution patterns are very important markers in gene evolution studies (<xref ref-type="bibr" rid="B27">Kimura, 1989</xref>). In all protein-coding genes of <italic>Cerasus</italic>, <italic>ndhB</italic>, <italic>petL</italic>, <italic>psbH</italic>, <italic>rpl33</italic>, <italic>rps18</italic>, and <italic>ycf15</italic> had no nonsynonymous rate change, and 20 genes (<italic>psaJ</italic>, <italic>psbA</italic>, <italic>atpE ndhE</italic>, <italic>ndhJ</italic>, <italic>psaC</italic>, <italic>petD</italic>, <italic>ycf3</italic>, <italic>ycf4</italic>, three <italic>rpl</italic> genes, three <italic>rps</italic> genes, and five <italic>psb</italic> genes) had no synonymous rate change. Fourteen genes showed neither substitution, including <italic>rpl23</italic>, <italic>rps7</italic>, <italic>rps8</italic>, <italic>rps12</italic>, <italic>petG</italic>, <italic>petN</italic>, <italic>psaI</italic>, <italic>psbI</italic>, <italic>psbJ</italic>, <italic>psbK</italic>, <italic>psbL</italic>, <italic>psbM</italic>, <italic>psbN</italic>, and <italic>psbT</italic>. <xref ref-type="supplementary-material" rid="SM6">
<bold>Table S6</bold>
</xref> lists the genes with both Ka and Ka substitutions. A Ka/Ks ratio &lt; 1, especially less than 0.5, indicates purifying selection; Ka/Ks &gt; 1 indicates likely positive selection; and Ka/Ks values close to 1 show neutral evolution, or relaxed selection (<xref ref-type="bibr" rid="B27">Kimura, 1989</xref>; <xref ref-type="bibr" rid="B24">Ivanova et&#xa0;al., 2017</xref>). The average Ka/Ks ratio analyzed in the 11 genomes was 0.3158 for 34 protein-coding genes, which were not region-specific. Most protein-coding genes have undergone purifying selection: 33 coding genes showed Ka/Ks &lt; 1, ranging from 0.0301 (<italic>atpA</italic>) to 0.8861 (<italic>ccsA</italic>). <italic>ycf2</italic>_IRA showed Ka/Ks &gt; 1, whereas the ratio for the other <italic>ycf2</italic> gene on IRB was 0.2908. The <italic>ccsA</italic> and <italic>ndh</italic> genes (except for <italic>ndhK</italic> in the LSC region) were located in the SSC region, <italic>ycf1</italic> was located at the boundary of the LSC and IR regions, and other genes existed in the LSC. Moreover, Ka/Ks ratios in the range of 0.5&#x2013;1 were observed for the genes <italic>petA</italic>, <italic>rps15</italic>, and <italic>ccsA</italic>, with the value of <italic>ccsA</italic> being close to 1, indicating neutral evolution (<xref ref-type="supplementary-material" rid="SM6">
<bold>Table S6A</bold>
</xref>; <xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S6</bold>
</xref>). The Ka/Ks values of the remaining genes were between 0.04 and 0.50, with <italic>rpoA</italic>, <italic>atpA</italic>, <italic>pet</italic>B, <italic>cemA</italic>, and <italic>rpoC1</italic> showing patterns of strong purifying selection pressure (Ka/Ks &lt; 0.1). For <italic>ycf2</italic>_IRA, <italic>matK</italic>, <italic>rpoC2</italic>, <italic>ccsA</italic>, and <italic>ndhI</italic>, the Ka/Ks ratio was greater than 1 in a few cases between the species (<xref ref-type="supplementary-material" rid="SM6">
<bold>Table S6B</bold>
</xref>), especially for <italic>ycf2</italic>_IRA in the comparison of <italic>P. tianshanica</italic> with other species. In addition, we analyzed the Ka/Ks ratios of the 10 cp genomes for comparison with <italic>P. avium</italic>, which reflected the selection pressure for the <italic>P. avium</italic> cp genome (<xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S7</bold>
</xref>). The average Ka/Ks values of most genes were less than 0.5, except for <italic>matK</italic>, <italic>rpoC2</italic>, and <italic>ycf2</italic>_IRA. The Ka/Ks value of <italic>matK</italic> was greater than 1 in the comparisons of <italic>P. avium</italic> with <italic>P. japonica</italic>, <italic>P. tomentosa</italic>, and <italic>P. tianshanica</italic> (<xref ref-type="supplementary-material" rid="SM6">
<bold>Table S6C</bold>
</xref>).</p>
<p>We found that photosynthesis genes had varying Ka/Ks ratios, which were all less than 1, including one large subunit of the RuBisCO gene <italic>rbcL</italic> (0.1799&#x2013;0.4581); two subunits of the photosystem II genes <italic>psbB</italic> and <italic>psbC</italic> (0.0643&#x2013;0.2921); two subunits of the cytochrome genes <italic>petA</italic> and <italic>petB</italic> (0.0561&#x2013;0.6536); and three subunits of the ATP synthase genes <italic>atpA</italic>, <italic>atpB</italic>, and <italic>atpF</italic> (0.0301&#x2013;0.3146). The ratios of five subunits of NADH dehydrogenase genes (<italic>ndhA</italic>, <italic>ndhD</italic>, <italic>ndhH</italic>, <italic>ndhG</italic>, <italic>ndhG</italic> and <italic>ndhI</italic>) ranged from 0.04701 to 1.7677, and the Ka/Ks ratio of <italic>ndhI</italic> was greater than 1. Ka/Ks ratios of self-replicating genes were as follows: 0.0566&#x2013;0.8818 for ribosomal protein small subunit genes (<italic>rps3</italic>, <italic>rps4</italic>, <italic>rps15</italic>, <italic>rps16</italic>), 0.2447&#x2013;0.496 for ribosomal protein large subunit genes (<italic>rpl16</italic> and <italic>rpl20</italic>), and 0.0327&#x2013;1.1722 for DNA-dependent RNA polymerase genes (<italic>rpoA</italic>, <italic>rpoB</italic>, <italic>rpoC1</italic>, and <italic>rpoC2</italic>). Among these, only <italic>rpoC2</italic> had Ka/Ks &gt; 1. Among the other genes, <italic>matK</italic>, <italic>ccsA</italic>, <italic>cemA</italic>, <italic>clpP</italic>, <italic>accD</italic>, <italic>ycf1</italic>, and <italic>ycf2</italic>, the Ka/Ks ratios of <italic>matK, ycf2</italic>, and <italic>ccsA</italic> were more than 1 (<xref ref-type="supplementary-material" rid="SM6">
<bold>Table S6B</bold>
</xref>).</p>
</sec>
<sec id="s3_5">
<label>3.5</label>
<title>Phylogenetic analysis</title>
<p>Organelle genome sequencing plays a key role in deciphering the evolutionary phylogenomics and cladistics of plant species. Phylogenetic relationships of <italic>Cerasus</italic> species were estimated with 6 datasets respectively, using Bayesian inference (BI) and ML methods. The results showed the tree topologies based on LSC, SSC, CDS and IGS datasets is basically consistent with complete plastome, especially using BI method (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figures S8</bold>
</xref>&#x2013;<xref ref-type="supplementary-material" rid="SM1">
<bold>S12</bold>
</xref>). Phylogenetic relationships were almost as consistent with BI and ML with the complete cp genome sequences (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>). In the ingroup, the subgenera <italic>Cerasus</italic>, <italic>Prunus</italic>, <italic>Armeniaca</italic>, and <italic>Amygdalus</italic> were divided into four major clades (clade I, clade II, clade III, and clade IV) with BI posterior probabilities (BIPP) of 100% and ML bootstrap support (MLBS) of 99&#x2013;100%. All of the clade I species belonged to subgenus <italic>Cerasus</italic> and all clade IV species belonged to subgenus <italic>Amygdalus</italic>. In clade III, only <italic>P. sibirica</italic> was an <italic>Armeniaca</italic> species, whereas the others belonged to <italic>Prunus</italic>. Among the four clades, clade II showed a relatively more complex composition, including dwarf cherry species (<italic>P. tomentosa</italic>, <italic>P. japonica</italic>, <italic>P. glandulosa</italic>, <italic>P. humilis</italic>, and <italic>P. dictyoneura</italic>) of <italic>Cerasus</italic>, <italic>Amygdalus</italic> (<italic>P. tenella</italic>, <italic>P. pedunculata</italic>, <italic>P. triloba</italic>), and <italic>Armeniaca</italic> (<italic>P. mume</italic>, <italic>P. mandshurica</italic>, and <italic>P. armeniaca</italic>). Through rebuilding the phylogenetic tree, clade II could be further divided into three small clades (BIPP = 99.87&#x2013;100%; MLBS = 94&#x2013;100%), named subclade I, subclade II, and subclade III, respectively. All species in subclade III belonged to <italic>Cerasus</italic>, and subclade I was also dominated by <italic>Cerasus</italic> except for <italic>P. triloba</italic>. Conversely, most of the subclade II species belonged to the subgenus <italic>Armeniaca</italic>, except for <italic>P. tenella</italic>. In clade I, <italic>P. mahaleb</italic> formed a separate branch (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>). <italic>P. trichostoma</italic> was the closest relative to <italic>P. rufa</italic>. <italic>P. cerasodies</italic>, <italic>P. fruticosa</italic>, <italic>P. cerasus</italic>, <italic>P. tianshanica</italic>, and <italic>P. cerasus</italic> &#xd7; <italic>P. canescens</italic> &#x2018;Gisela 6&#x2019; were divided into the same small clade, which was close to the clade formed by <italic>P. avium</italic>, <italic>P. clarofolia</italic>, and <italic>P. setulasa. P. serrula</italic> was divided into a clade with <italic>P. pseudocerasus</italic> and <italic>P. clarofolia</italic>. <italic>P. serrula</italic> was the closest relative to <italic>P. fengyangshanica</italic>, <italic>P. jamasakura</italic>, <italic>P. dielsiana</italic>, and seven other species. Surprisingly, <italic>P. tomentosa</italic> and <italic>P. japonica</italic> were separated from the majority of <italic>Cerasus</italic> species and were most closely related to <italic>P. triloba</italic> and <italic>P. pedunculata</italic> of the subgenus <italic>Amygdalus</italic> (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>).</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Phylogenetic tree reconstruction of 45 <italic>Cerasus</italic> species and 23 other Prunoideae species based on whole chloroplast genome sequences. <bold>(A)</bold> Phylogenetic tree reconstruction using the program Mrbayes of Geneious Prime v2022.0.2. Numbers above the lines represent the Bayesian inference posterior probability (percent). <bold>(B)</bold> Phylogenetic tree reconstruction using Maximum likelihood method of MEGA v11. Numbers below the lines represent the bootstrap support values.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-14-1070600-g006.tif"/>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<sec id="s4_1">
<label>4.1</label>
<title><italic>Cerasus</italic> cp genome features and genomic variation</title>
<p>The cp genome exhibits maternal inheritance in contrast to the nuclear genome (<xref ref-type="bibr" rid="B42">Palmer, 1985</xref>). Because of its evolutionarily conserved structure, sequence length, and constituent genes, the cp genome has been widely used in analyses of genetic variation and phylogeny with moderate base replacement (<xref ref-type="bibr" rid="B42">Palmer, 1985</xref>; <xref ref-type="bibr" rid="B44">Ravi et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B57">Wicke et&#xa0;al., 2011</xref>). In this study, the 11 <italic>Cerasus</italic> cp genomes presented a typical quadripartite structure (LSC, SSC, IRA, and IRB), as reported for other <italic>Prunus</italic> species (<xref ref-type="bibr" rid="B59">Xue et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B31">Li et&#xa0;al., 2022</xref>) and land plants (<xref ref-type="bibr" rid="B57">Wicke et&#xa0;al., 2011</xref>; <xref ref-type="bibr" rid="B64">Zhang et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B33">Liu et&#xa0;al., 2020</xref>). The <italic>Cerasus</italic> cp genome size (157,571&#x2013;158,830 bp) was similar to that of previously reported <italic>Prunus</italic> species such as <italic>P. pseudocerasus</italic> (157,834 bp), <italic>P. dielsiana</italic> (158,005 bp), <italic>P. clarofolia</italic> (157,899 bp), <italic>P. mira</italic> (158,153 bp), and <italic>P. salicina</italic> (157,916 bp) (<xref ref-type="bibr" rid="B14">Feng et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B3">Bao et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B59">Xue et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B65">Zhao et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B31">Li et&#xa0;al., 2022</xref>). This indicated that the length of the cp sequence is relatively conserved with only moderate variation among species of the <italic>Prunus</italic> genus.</p>
<p>Comparative analysis of <italic>Cerasus</italic> species showed that the LSC and SSC regions were more divergent than the IR regions (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>), whereas the CNSs showed significant divergence (<xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S3</bold>
</xref>), consistent with findings for other species (<xref ref-type="bibr" rid="B59">Xue et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B33">Liu et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B52">Wang et&#xa0;al., 2021</xref>). One of the most important factors contributing to the variation in plastome size between species may be the expansion and contraction of IR boundaries (<xref ref-type="bibr" rid="B59">Xue et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>). The contraction and expansion of <italic>rps19</italic> and <italic>ndhF</italic> were predicted as the main contributors to the overall variation observed among the <italic>Cerasus</italic> cp genomes, followed by expansion of <italic>ycf1</italic> toward the SSC region (<xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3</bold>
</xref>, <xref ref-type="supplementary-material" rid="SM1">
<bold>S4</bold>
</xref>). The three genes at IR boundaries were consistent in <italic>P. mume</italic>, <italic>P</italic>. <italic>salicina</italic>, and <italic>P. armeniaca</italic> (<xref ref-type="bibr" rid="B59">Xue et&#xa0;al., 2019</xref>). Significant IR contraction of <italic>rps19</italic> and <italic>ndhF</italic> was observed in the plastomes of some <italic>Cerasus</italic> and other <italic>Prunus</italic> species (<xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B53">Wang et&#xa0;al., 2022</xref>). In addition, displacement of the <italic>trnH</italic> gene at the IR/LSC locus was detected in the aforementioned studies and the current study. This pattern of these four genes located at IR boundaries was also found in species of other genera, including <italic>Malus</italic> (<xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B53">Wang et&#xa0;al., 2022</xref>), <italic>Diospyros</italic> (<xref ref-type="bibr" rid="B19">Heinze et&#xa0;al., 2016</xref>), and <italic>Morella</italic> (<xref ref-type="bibr" rid="B34">Liu et&#xa0;al., 2017</xref>). Therefore, although the IR regions are highly conserved for stabilizing the cp genome structure (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>) (<xref ref-type="bibr" rid="B35">Marechal and Brisson, 2010</xref>), some changes (especially in <italic>rps19, ndhF</italic>, and <italic>ycf1</italic>) are evident at the IR border areas among <italic>Cerasus</italic> species, in line with reports for other species and genera.</p>
<p>We annotated 115 unique genes in this study (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>), which is similar to the findings reported for other <italic>Prunus</italic> plastomes with 110&#x2013;115 unique genes (<xref ref-type="bibr" rid="B59">Xue et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B51">Wang et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B31">Li et&#xa0;al., 2022</xref>). There were four rRNA genes detected (4.5S rRNA, 5S rRNA, 16S rRNA, and 23S rRNA), which coincides with reports for land plants (<xref ref-type="bibr" rid="B49">Sugiura, 1992</xref>). The differences were mainly reflected in tRNA and protein-coding genes, such as <italic>ycf</italic> genes (<xref ref-type="bibr" rid="B59">Xue et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>). The <italic>ycf15</italic> gene was detected in all 11 <italic>Cerasus</italic> cp genomes, but is lacking in some <italic>Prunus</italic> (<italic>sensu lato</italic>) plastomes (<xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>). According to previous reports, angiosperm plastomes harbor approximately 70&#x2013;88 protein-coding genes (<xref ref-type="bibr" rid="B33">Liu et&#xa0;al., 2020</xref>) and 80 unique protein-coding genes were annotated in this study. We found some CDSs and CNSs with relatively high nucleotide diversity (<xref ref-type="supplementary-material" rid="SM2">
<bold>Table S2</bold>
</xref>; <xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S3</bold>
</xref>), which was in line with previous research (<xref ref-type="bibr" rid="B59">Xue et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B33">Liu et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B52">Wang et&#xa0;al., 2021</xref>). Analyses of cp genes and genomes have largely contributed to resolving portions of the plant tree of life (<xref ref-type="bibr" rid="B44">Ravi et&#xa0;al., 2007</xref>). Various genes and IGRs have been identified as evolutionarily significant markers, which have been widely used for phylogenetic analyses (<xref ref-type="bibr" rid="B44">Ravi et&#xa0;al., 2007</xref>). Intergenic spacer regions were proposed to be the best barcoding candidates (<xref ref-type="bibr" rid="B44">Ravi et&#xa0;al., 2007</xref>), which was also confirmed in this study, and we further found that the <italic>Pi</italic> of the IGRs was higher than that of the CDSs (<xref ref-type="supplementary-material" rid="SM2">
<bold>Table S2</bold>
</xref>; <xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S3</bold>
</xref>). Nevertheless, both the IGRs and CDSs can serve as useful molecular markers. Some genes (<italic>matK</italic>, <italic>rps16</italic>, <italic>rbcL</italic>, <italic>rpl16</italic>, <italic>ndhA, ndhF</italic>, and <italic>ycf1</italic>) and IGRs (<italic>rps16</italic>-<italic>trnQ</italic>, <italic>petN</italic>-<italic>psbM</italic>, <italic>rps15</italic>-<italic>ycf1</italic>, <italic>trn</italic>L-<italic>trnF</italic>) exhibited high nucleotide diversity (<xref ref-type="supplementary-material" rid="SM2">
<bold>Table S2</bold>
</xref>), which have also been used for phylogenetic and phylogeography analyses (<xref ref-type="bibr" rid="B44">Ravi et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B8">Chavez et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B50">Uchoi et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B60">Yang et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B26">Khan et&#xa0;al., 2018</xref>).</p>
</sec>
<sec id="s4_2">
<label>4.2</label>
<title>Evolutionary and phylogenetic analysis</title>
<p>Repeats play an important role in genome rearrangement, which can increase the probability of replication fork stagnation, causing an error to recruit persistently specific sequence regions over evolutionary time scales (<xref ref-type="bibr" rid="B37">Mcdonald et&#xa0;al., 2011</xref>). Repetitive sequences may facilitate intermolecular recombination and enhance plastome diversity, as an abundance of sequence repeats results in genome regions with increased sequence diversity in prokaryotes and eukaryotes (<xref ref-type="bibr" rid="B37">Mcdonald et&#xa0;al., 2011</xref>; <xref ref-type="bibr" rid="B33">Liu et&#xa0;al., 2020</xref>). We also found abundant repeats in the <italic>Cerasus</italic> genome, including dispersed, palindromic, and tandem repeats, along with SSRs (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM4">
<bold>Table S4A</bold>
</xref>). More abundant SSRs were detected in IGRs for most species, except for <italic>P. tianshanica</italic> (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM4">
<bold>Table S4A</bold>
</xref>) and other <italic>Prunus</italic> species (<xref ref-type="bibr" rid="B51">Wang et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>). Combined with the visualization of aligned genome sequences, CNSs showed more significant divergence (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>). This suggested that repetitive CNSs might be the main force promoting cp genome rearrangement in <italic>Prunus</italic> species (<xref ref-type="bibr" rid="B51">Wang et&#xa0;al., 2021</xref>). Furthermore, given the characteristics of maternal inheritance, conservation, and simple structure of the cp genome, cp microsatellites with a high degree of polymorphism can serve as useful molecular markers to identify genetic relationships, population genetic structure, and phylogeography patterns at the inter- and intrapopulation levels (<xref ref-type="bibr" rid="B12">Decroocq et&#xa0;al., 2004</xref>; <xref ref-type="bibr" rid="B52">Wang et&#xa0;al., 2021</xref>). We only detected mono-, di-, and tri-nucleotide repeats in the <italic>Cerasus</italic> cp genomes (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM4">
<bold>Table S4</bold>
</xref>) with a greater content of A/T repeats than of G/C repeats, similar to the results of other studies in the genus <italic>Prunus</italic> (<xref ref-type="bibr" rid="B59">Xue et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>). The SSRs identified in this study provide useful information for developing genetic markers to further study the population genetics, evolution, and breeding of the subgenus <italic>Cerasus</italic>, as well as for the identification and conservation of <italic>Cerasus</italic> species. Repetitive sequences are also essential for research on indels and substitutions (<xref ref-type="bibr" rid="B52">Wang et&#xa0;al., 2021</xref>), which are highly abundant in the plastome of <italic>Cerasus</italic> (<xref ref-type="supplementary-material" rid="SM3">
<bold>Table S3</bold>
</xref>) and other members of the family Rosaceae (<xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>).</p>
<p>Codon usage and synonymous/nonsynonymous substitutions play an important role in cp plastome evolution (<xref ref-type="bibr" rid="B24">Ivanova et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B21">Huang et&#xa0;al., 2021</xref>). Mutation is one of the most essential factors affecting codon usage, thus influencing the evolutionary course (<xref ref-type="bibr" rid="B24">Ivanova et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B52">Wang et&#xa0;al., 2021</xref>). Moreover, codon-choice patterns are considered to be highly conserved during the evolution process (<xref ref-type="bibr" rid="B23">Ikemura, 1985</xref>). An RSCU value &gt; 1, &lt; 1, or = 1 indicates preference, low usage, and no preference for a codon, respectively (<xref ref-type="bibr" rid="B47">Sharp and Li, 1987</xref>). We found biased codon usage in the <italic>Cerasus</italic> cp genome, with 19 amino acids having an RSCU value &gt;1 (<xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S5</bold>
</xref>). The codon profile showed strong bias toward the use of A/T in the third-base position, which appears to be a general phenomenon (<xref ref-type="bibr" rid="B41">Murray et&#xa0;al., 1989</xref>). Leucine and isoleucine appeared the most frequently and were biased toward UUA and AUU, respectively (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figures S5</bold>
</xref>, <xref ref-type="fig" rid="f5">
<bold>5</bold>
</xref>), whereas cysteine was the least frequently detected, with the third base also biased toward T (UGU) in codon usage (<xref ref-type="supplementary-material" rid="SM1">
<bold>Figures S5</bold>
</xref>, <xref ref-type="fig" rid="f5">
<bold>5</bold>
</xref>). Among the three stop codons, there was clear usage bias toward UAA (RSCU &gt; 1.00) (<xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S5</bold>
</xref>). These results are largely consistent with reports of the cp genomes in <italic>P. zhengheensis</italic> (<xref ref-type="bibr" rid="B21">Huang et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B51">Wang et&#xa0;al., 2021</xref>) and other species (<xref ref-type="bibr" rid="B1">Alzahrani et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B33">Liu et&#xa0;al., 2020</xref>). Two amino acids, methionine (AUG) and tryptophan (UGG), showed no codon usage bias (RSCU = 1.00) (<xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S5</bold>
</xref>). In other words, all amino acids are encoded by 2&#x2013;6 synonymous codons with the exception of methionine and tryptophan (<xref ref-type="bibr" rid="B41">Murray et&#xa0;al., 1989</xref>).</p>
<p>The Ka and Ks nucleotide substitution rates as well as the Ka/Ks ratio are widely used to evaluate the sequence divergence and purifying selection in protein-coding genes. In most genes, with the exception of very rapidly evolving genes, Ka nucleotide substitutions occur less frequently than Ks owing to the action of purifying selection (<xref ref-type="bibr" rid="B24">Ivanova et&#xa0;al., 2017</xref>). Ks nucleotide substitutions generally occur more frequently than Ka substitutions (<xref ref-type="bibr" rid="B34">Liu et&#xa0;al., 2017</xref>), which was also detected for <italic>Cerasus</italic> in this study. Among the changed genes, almost all Ka/Ks ratios were less than 1.0 (<xref ref-type="supplementary-material" rid="SM1">
<bold>Tables S5</bold>
</xref>, <xref ref-type="supplementary-material" rid="SM1">
<bold>S6</bold>
</xref>), providing evidence for purifying selection on the protein-coding genes of the cp genome in the genus <italic>Prunus</italic> and family Rosaceae. According to the Ka/Ks values, we found that <italic>rpoA</italic>, <italic>atpA, petB</italic>, <italic>cemA</italic>, and <italic>rpoC1</italic> exhibited strong purifying selection. The <italic>ccsA</italic> was under neutral selection, whereas <italic>ycf2</italic> genes showed a signature of possible positive selection during the course of <italic>Cerasus</italic> evolution (<xref ref-type="supplementary-material" rid="SM6">
<bold>Table S6</bold>
</xref>), owing to an inserted fragment in the middle of the gene (<xref ref-type="supplementary-material" rid="SF1">
<bold>Figure S2A</bold>
</xref>), in line with the Ka/Ks analyses. However, these patterns are in contrast to previous research on <italic>Cerasus</italic> (<xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>), in which the <italic>matK</italic> and <italic>rpoC2</italic> genes both showed signatures of positive selection, along with other genes such as <italic>ndhF</italic>, <italic>atpA</italic>, and <italic>psaA</italic>. Under conditions of extreme temperature and changing light intensity, the <italic>ndhF</italic> gene can balance the redox levels to maintain or enhance photosynthetic performance (<xref ref-type="bibr" rid="B36">Martin et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>). In addition, <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al. (2021)</xref> detected strong signatures of positive selection in several genes of Rosaceae, including <italic>rpoA</italic>, <italic>rps16, rps18, psaA, psbL, rbcL, ndhD, ndhF, accD, ycf1</italic>, and <italic>ycf2</italic>. In particular, the <italic>rbcL</italic> gene encodes the large subunit of RuBisCO, which is one of the most useful enzymes for studying plant evolution, serving as a model protein in several studies owing to its response to environmental pressure and climate shifts (<xref ref-type="bibr" rid="B20">Hermida-Carrera et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>). In addition to <italic>rbcL</italic>, <italic>ndhF</italic>, <italic>ycf1</italic>, and <italic>rps18</italic> had high <italic>Pi</italic> values in this study, which can help Rosaceae woody fruit trees efficiently capture light energy to obtain sufficient nutrition for growth and development as an adaptation under extreme and variable environmental conditions (<xref ref-type="supplementary-material" rid="SM2">
<bold>Table S2</bold>
</xref>). Hence, it is necessary to further study the patterns of synonymous and non-synonymous substitutions among <italic>Cerasus</italic> species, which can provide new insight into the evolution of Rosaceae.</p>
<p>The subgenus <italic>Cerasus</italic> can be classified in two sections of true cherry (<italic>Cerasus sensu stricto</italic>) and dwarf cherry (<italic>Microcerasus</italic>), according to <xref ref-type="bibr" rid="B61">Y&#xfc; et&#xa0;al. (1986)</xref>. The genetic evolution of <italic>Cerasus</italic> species has been a long-standing open research question (<xref ref-type="bibr" rid="B32">Liang et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>). Given its maternal inheritance, the cp genome has been widely used for species classification and evolutionary analyses (<xref ref-type="bibr" rid="B53">Wang et&#xa0;al., 2022</xref>). Therefore, we reconstructed the <italic>Cerasus</italic> phylogenetic tree based on the complete cp genome (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>). In line with the classification proposed by <xref ref-type="bibr" rid="B61">Y&#xfc; et&#xa0;al. (1986)</xref> and others, true cherry species were classified in a single group as clade I (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>). Surprisingly, <italic>P. tianshanica</italic>, as a <italic>Microcerasus</italic> species, also clustered in the true cherry group and formed a clade with <italic>P. cerasus</italic>, <italic>P. fruticosa</italic>, <italic>P. cerasus</italic> &#xd7; <italic>P. canescens</italic> &#x2018;Gisela 6&#x2019;, and <italic>P. avium</italic>. Moreover, <italic>P. mahaleb</italic> in clade I was separated from other true cherry species, which is in line with previous reports (<xref ref-type="bibr" rid="B10">Chin et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>). Further subdivisions of true cherry match the existing classification (<xref ref-type="bibr" rid="B61">Y&#xfc; et&#xa0;al., 1986</xref>; <xref ref-type="bibr" rid="B56">Webster and Looney, 1996</xref>) proposing <italic>P. mahaleb</italic> or <italic>P. emarginata</italic>, <italic>P. pennsylvanica</italic>, and <italic>P. prunifolia</italic> as a separate group, named section <italic>Mahaleb</italic> Focke (<xref ref-type="supplementary-material" rid="SM7">
<bold>Table S7</bold>
</xref>). However, in the present study, <italic>P. emarginata</italic> was not grouped with <italic>P. mahaleb</italic> (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>). In addition, we found that some true cherry species did not follow the grouping of existing classifications (<xref ref-type="bibr" rid="B61">Y&#xfc; et&#xa0;al., 1986</xref>; <xref ref-type="bibr" rid="B56">Webster and Looney, 1996</xref>) or varied to a certain extent at the section level, such as <italic>P. tianshanica</italic>, <italic>P. serrula</italic>, and <italic>P. serrulata</italic> (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM7">
<bold>Table S7</bold>
</xref>). <italic>Microcerasus</italic> also showed a significant difference from other taxa (<xref ref-type="supplementary-material" rid="SM7">
<bold>Table S7</bold>
</xref>) (<xref ref-type="bibr" rid="B61">Y&#xfc; et&#xa0;al., 1986</xref>; <xref ref-type="bibr" rid="B56">Webster and Looney, 1996</xref>), which were grouped with <italic>Amygdalus, Armeniaca</italic>, and <italic>Prunus</italic> as a subclade in this study (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>). These relationships were also reported in previous studies (<xref ref-type="bibr" rid="B9">Chen et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B31">Li et&#xa0;al., 2022</xref>). <italic>Microcerasus</italic> showed close evolutionary relationships to <italic>Amygdalus</italic> (<italic>P. tenella</italic>, <italic>P. pedunculata</italic>, and <italic>P. triloba</italic>) and <italic>Armeniaca</italic> (<italic>P. mume</italic>, <italic>P. mandshurica</italic>, and <italic>P. armeniaca</italic>) species. Specifically, <italic>P. japonica</italic> and <italic>P. tomentosa</italic> were the closest relatives to <italic>Amygdalus</italic> (<italic>P. triloba</italic> and <italic>P. pedunculata</italic>). Previous studies also revealed that <italic>P. pesica</italic> in <italic>Amygdalus</italic> was closely related to <italic>Microcerasus</italic> (<xref ref-type="bibr" rid="B9">Chen et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B54">Wang et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>). Hence, during the evolution process, true cherry formed a distinct group, while <italic>Microcerasus</italic> remained genetically closer to <italic>Amygdalus</italic>, <italic>Armeniaca</italic>, and <italic>Prunus</italic> (<italic>sensu stricto</italic>) than to true cherry. These results can be supported by multi-cp genome comparative (<xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2021</xref>) and whole-genome analyses (<xref ref-type="bibr" rid="B54">Wang et&#xa0;al., 2020</xref>). Nevertheless, further breakdown of <italic>Cerasus</italic> (<italic>sensu stricto</italic>) should not be ignored based on these results, which contrast with the existing classification criteria (<xref ref-type="bibr" rid="B61">Y&#xfc; et&#xa0;al., 1986</xref>; <xref ref-type="bibr" rid="B56">Webster and Looney, 1996</xref>). Accordingly, further study of the taxa of the subgenus <italic>Cerasus</italic>, especially <italic>Microcerasus</italic>, is necessary to enable breeding novel cherry cultivars and to gain a better understanding of the evolution of <italic>Prunus sensu lato</italic> specifically and Rosaceae plants more broadly.</p>
</sec>
</sec>
<sec id="s5" sec-type="conclusion">
<label>5</label>
<title>Conclusion</title>
<p>Comparative analysis of the cp genome is a key approach to study the molecular evolution and reconstruct the phylogenetic tree of <italic>Cerasus</italic> species. The present analysis of the cp genomes of 11 <italic>Cerasus</italic> species showed that IR regions are more strongly conserved than the LSC and SSC regions, whereas the non-coding sequences showed more significant divergence than the coding regions. The contraction/expansion of <italic>rps19</italic> and <italic>ndhF</italic> at the IR boundaries were the main contributors to the observed variation among <italic>Cerasus</italic> cp genomes, as well as variation in <italic>ycf1</italic> and <italic>trnH</italic>. We identified 26 genes and IGRs with variations that can be used as potential molecular markers and candidate DNA barcodes for studying the phylogeny and phylogeography of cherry species. We further provided important evidence that <italic>P. mahaleb</italic> forms a unique clade among true cherry (<italic>Cerasus sensu stricto</italic>) due to plastid genome rearrangement. <italic>Microcerasus</italic> was found to be genetically closer to <italic>Amygdalus</italic>, <italic>Armeniaca</italic>, and <italic>Prunus</italic> (<italic>sensu stricto</italic>) than to true cherry species. Moreover, <italic>P. tianshanica</italic> emerged as a noteworthy species given its close relationship to <italic>P. avium</italic>. Overall, these findings provide new insight and resources to breed novel cultivated sweet cherry and cherry rootstock in the future.</p>
</sec>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>TW and Y-LC designed the research. TW performed the experiments and analyzed the data. Y-LC identified the plant materials and revised the manuscript. B-XQ, JZ, and K-SS revised the manuscript. FA assembled the sequences. TW, B-XQ, JZ, L-YP, and FA annotated the plastomes. TW, K-SS, L-YP, X-SH, TL, and P-KL collected the plant materials. FA and L-YP provided analysis support. All authors contributed to the article and approved the submitted version.</p>
</sec>
</body>
<back>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>This work was financially supported by the Bingtuan Science and Technology Program (Grant number: 2021AB017) and the Agricultural Science and Technology Innovation and Transformation Project of Shaanxi province (Grant number: NYKJ-2022-YL(XN)47). The funders had no role in study design, data collection, data analysis, data interpretation, the writing of the manuscript, or decision to publish.</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>We are grateful to Associate Professor Zengqiang Qian from College of Life Sciences, Shaanxi Normal University, and Guoqing Bai from Xi&#x2019;an Botanical Garden of Shaanxi Province (Institute of Botany of Shaanxi Province Shaanxi) and Engineering Research Centre for Conservation and Utilization of Botanical Resources for their useful advice and help in data analyses.</p>
</ack>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2023.1070600/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2023.1070600/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet_1.docx" id="SF1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="Table_1.xlsx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_2.xlsx" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_3.xlsx" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_4.xlsx" id="SM4" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_5.xlsx" id="SM5" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_6.xlsx" id="SM6" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Table_7.xlsx" id="SM7" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alzahrani</surname> <given-names>D. A.</given-names>
</name>
<name>
<surname>Yaradua</surname> <given-names>S. S.</given-names>
</name>
<name>
<surname>Albokhari</surname> <given-names>E. J.</given-names>
</name>
<name>
<surname>Abba</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Complete chloroplast genome sequence of <italic>Barleria prionitis</italic>, comparative chloroplast genomics and phylogenetic relationships among acanthoideae</article-title>. <source>BMC Genomics</source> <volume>21</volume>, <fpage>393</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12864-020-06798-2</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Amiryousefi</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Hyvonen</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Poczai</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>IRscope: an online program to visualize the junction sites of chloroplast genomes</article-title>. <source>Bioinformatics</source> <volume>34</volume>, <fpage>3030</fpage>&#x2013;<lpage>3031</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bty220</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bao</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Ao</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Wuyun</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>The complete chloroplast genome of <italic>Prunus mira</italic> koehne (Prunoideae, rosaceae), a wild and indigenous peach on Tibet, China</article-title>. <source>Mitochond. DNA B</source> <volume>4</volume>, <fpage>3731</fpage>&#x2013;<lpage>3733</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/23802359.2019.1679048</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beier</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Thiel</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Munch</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Scholz</surname> <given-names>U.</given-names>
</name>
<name>
<surname>Mascher</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>MISA-web: A web server for microsatellite prediction</article-title>. <source>Bioinformatics</source> <volume>33</volume>, <fpage>2583</fpage>&#x2013;<lpage>2585</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btx198</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bortiri</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Oh</surname> <given-names>S. H.</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Baggett</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Granger</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Weeks</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2001</year>). <article-title>Phylogeny and systematics of <italic>Prunus</italic> (Rosaceae) as determined by sequence analysis of ITS and the chloroplast trnL-trnF spacer DNA</article-title>. <source>Syst. Bot.</source> <volume>26</volume>, <fpage>797</fpage>&#x2013;<lpage>807</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1043/0363-6445-26.4.797</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brudno</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Malde</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Poliakov</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Do</surname> <given-names>C. B.</given-names>
</name>
<name>
<surname>Couronne</surname> <given-names>O.</given-names>
</name>
<name>
<surname>Dubchak</surname> <given-names>I.</given-names>
</name>
<etal/>
</person-group>. (<year>2003</year>). <article-title>Glocal alignment: finding rearrangements during alignment</article-title>. <source>Bioinformatics</source> <volume>19 Suppl 1</volume>, <fpage>i54</fpage>&#x2013;<lpage>i62</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btg1005</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chan</surname> <given-names>P. P.</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>B. Y.</given-names>
</name>
<name>
<surname>Mak</surname> <given-names>A. J.</given-names>
</name>
<name>
<surname>Lowe</surname> <given-names>T. M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>tRNAscan-SE 2.0: improved detection and functional classification of transfer RNA genes</article-title>. <source>Nucleic Acids Resour.</source> <volume>49</volume>, <fpage>9077</fpage>&#x2013;<lpage>9096</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkab688</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chavez</surname> <given-names>D. J.</given-names>
</name>
<name>
<surname>Beckman</surname> <given-names>T. G.</given-names>
</name>
<name>
<surname>Chaparro</surname> <given-names>J. X.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Identifying the north American plum species phylogenetic signal using nuclear, mitochondrial, and chloroplast DNA markers</article-title>. <source>J. Am. Soc Hortic. Sci.</source> <volume>141</volume>, <fpage>623</fpage>&#x2013;<lpage>644</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.21273/jashs03875-16</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>H. R.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>The complete chloroplast genome of tomentosa cherry <italic>Prunus tomentosa</italic> (Prunoideae, rosaceae)</article-title>. <source>Mitochond. DNA B</source> <volume>3</volume>, <fpage>672</fpage>&#x2013;<lpage>673</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/23802359.2018.1476068</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chin</surname> <given-names>S. W.</given-names>
</name>
<name>
<surname>Shaw</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Haberle</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Wen</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Potter</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Diversification of almonds, peaches, plums and cherries - molecular systematics and biogeographic history of <italic>Prunus</italic> (Rosaceae)</article-title>. <source>Mol. Phylogen. Evol.</source> <volume>76</volume>, <fpage>34</fpage>&#x2013;<lpage>48</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ympev.2014.02.024</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Daniell</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>C. S.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Chang</surname> <given-names>W. J.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Chloroplast genomes: diversity, evolution, and applications in genetic engineering</article-title>. <source>Genome Biol.</source> <volume>17</volume>, <fpage>134</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13059-016-1004-2</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Decroocq</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Hagen</surname> <given-names>L. S.</given-names>
</name>
<name>
<surname>Fav&#xe9;</surname> <given-names>M.-G.</given-names>
</name>
<name>
<surname>Eyquard</surname> <given-names>J.-P.</given-names>
</name>
<name>
<surname>Pierronnet</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Microsatellite markers in the hexaploid <italic>Prunus domestica</italic> species and parentage lineage of three European plum cultivars using nuclear and chloroplast simple-sequence repeats</article-title>. <source>Mol. Breed.</source> <volume>13</volume>, <fpage>135</fpage>&#x2013;<lpage>142</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1023/B:MOLB.0000018761.04559.b3</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dunning</surname> <given-names>L. T.</given-names>
</name>
<name>
<surname>Olofsson</surname> <given-names>J. K.</given-names>
</name>
<name>
<surname>Papadopulos</surname> <given-names>A. S. T.</given-names>
</name>
<name>
<surname>Hibdige</surname> <given-names>S. G. S.</given-names>
</name>
<name>
<surname>Hidalgo</surname> <given-names>O.</given-names>
</name>
<name>
<surname>Leitch</surname> <given-names>I. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Hybridisation and chloroplast capture between distinct themeda triandra lineages in Australia</article-title>. <source>Mol. Ecol</source> <volume>31</volume>, <fpage>5846</fpage>&#x2013;<lpage>5860</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/mec.16691</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feng</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X. Y.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>B. B.</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>C. L.</given-names>
</name>
<name>
<surname>Cai1</surname> <given-names>Y. L.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Characterization of the complete chloroplast genome of the Chinese cherry <italic>Prunus pseudocerasus</italic> (Rosaceae)</article-title>. <source>Conserv. Genet. Resour.</source> <volume>10</volume>, <fpage>85</fpage>&#x2013;<lpage>88</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s12686-017-0770-9</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Frazer</surname> <given-names>K. A.</given-names>
</name>
<name>
<surname>Pachter</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Poliakov</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Rubin</surname> <given-names>E. M.</given-names>
</name>
<name>
<surname>Dubchak</surname> <given-names>I.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>VISTA: Computational tools for comparative genomics</article-title>. <source>Nucleic Acids Res.</source> <volume>32</volume>, <fpage>W273</fpage>&#x2013;<lpage>W279</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkh458</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Greiner</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Lehwark</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Bock</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>OrganellarGenomeDRAW (OGDRAW) version 1.3.1: Expanded toolkit for the graphical visualization of organellar genomes</article-title>. <source>Nucleic Acids Res.</source> <volume>47</volume>, <fpage>W59</fpage>&#x2013;<lpage>W64</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkz238</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Greiner</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Rauwolf</surname> <given-names>U.</given-names>
</name>
<name>
<surname>Meurer</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Herrmann</surname> <given-names>R. G.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>The role of plastids in plant speciation</article-title>. <source>Mol. Ecol.</source> <volume>20</volume>, <fpage>671</fpage>&#x2013;<lpage>691</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1365-294X.2010.04984.x</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hahn</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Bachmann</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Chevreux</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Reconstructing mitochondrial genomes directly from genomic next-generation sequencing reads-a baiting and iterative mapping approach</article-title>. <source>Nucleic Acids Res.</source> <volume>41</volume>, <elocation-id>e129</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkt371</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Heinze</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Fu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>Five complete chloroplast genome sequences from <italic>Diospyros</italic>: Genome organization and comparative analysis</article-title>. <source>PloS One</source> <volume>11</volume>, <elocation-id>e0159566</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0159566</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hermida-Carrera</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Fares</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Fernandez</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Gil-Pelegrin</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Kapralov</surname> <given-names>M. V.</given-names>
</name>
<name>
<surname>Mir</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Positively selected amino acid replacements within the RuBisCO enzyme of oak trees are associated with ecological adaptations</article-title>. <source>PloS One</source> <volume>12</volume>, <elocation-id>e0183970</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0183970</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Tan</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Liao</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>T.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>The chloroplast genome of <italic>Prunus zhengheensis</italic>: Genome comparative and phylogenetic relationships analysis</article-title>. <source>Gene</source> <volume>793</volume>, <elocation-id>145751</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.gene.2021.145751</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huelsenbeck</surname> <given-names>J. P.</given-names>
</name>
<name>
<surname>Ronquist</surname> <given-names>F.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>MRBAYES: Bayesian inference of phylogenetic trees</article-title>. <source>Bioinformatics</source> <volume>17</volume>, <fpage>754</fpage>&#x2013;<lpage>755</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/17.8.754</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ikemura</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>1985</year>). <article-title>Codon usage and tRNA content in unicellular and multicellular organisms</article-title>. <source>Mol. Biol. Evol.</source> <volume>2</volume>, <fpage>13</fpage>&#x2013;<lpage>34</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/oxfordjournals.molbev.a040335</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ivanova</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Sablok</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Daskalova</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Zahmanova</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Apostolova</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Yahubyan</surname> <given-names>G.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Chloroplast genome Analysis of resurrection tertiary relict <italic>Haberlea rhodopensis</italic> highlights genes important for desiccation stress response</article-title>. <source>Front. Plant Sci.</source> <volume>8</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2017.00204</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kearse</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Moir</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Wilson</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Stones-Havas</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Cheung</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Sturrock</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title>Geneious basic: An integrated and extendable desktop software platform for the organization and analysis of sequence data</article-title>. <source>Bioinformatics</source> <volume>28</volume>, <fpage>1647</fpage>&#x2013;<lpage>1649</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bts199</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khan</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Fu</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Spiroides shrubs on qinghai-Tibetan plateau: Multilocus phylogeography and palaeodistributional reconstruction of <italic>Spiraea alpina</italic> and <italic>S. mongolica</italic> (Rosaceae)</article-title>. <source>Mol. Phylogen. Evol.</source> <volume>123</volume>, <fpage>137</fpage>&#x2013;<lpage>148</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ympev.2018.02.009</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kimura</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>1989</year>). <article-title>The neutral theory of molecular evolution and the world view of the neutralists</article-title>. <source>Genome</source> <volume>31</volume>, <fpage>24</fpage>&#x2013;<lpage>31</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1139/g89-009</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kumar</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Stecher</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Tamura</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>MEGA7: Molecular evolutionary genetics analysis version 7.0 for bigger datasets</article-title>. <source>Mol. Biol. Evol.</source> <volume>33</volume>, <fpage>1870</fpage>&#x2013;<lpage>1874</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msw054</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kurtz</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Choudhuri</surname> <given-names>J. V.</given-names>
</name>
<name>
<surname>Ohlebusch</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Schleiermacher</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Stoye</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Giegerich</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>REPuter: The manifold applications of repeat analysis on a genomic scale</article-title>. <source>Nucleic Acids Res.</source> <volume>29</volume>, <fpage>4633</fpage>&#x2013;<lpage>4642</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/29.22.4633</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Letunic</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Bork</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Interactive tree of life (iTOL) v5: An online tool for phylogenetic tree display and annotation</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>W293</fpage>&#x2013;<lpage>W296</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkab301</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Yan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Bai</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Nie</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Xiong</surname> <given-names>Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>The complete chloroplast genome of <italic>Prunus clarofolia</italic> (Rosaceae), a wild cherry endemic to China</article-title>. <source>MITOCHONDRIAL DNA Part B</source> <volume>7</volume>, <fpage>164</fpage>&#x2013;<lpage>166</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/23802359.2021.2016080</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Wan</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Molecular identification and genetic analysis of cherry cultivars using capillary electrophoresis with fluorescence-labeled SSR markers</article-title>. <source>3 Biotech.</source> <volume>8</volume>, <fpage>16</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s13205-017-1036-7</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Schwarzacher</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Heslop-Harrison</surname> <given-names>J. S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Comparative chloroplast genome analyses of <italic>Avena</italic>: Insights into evolutionary dynamics and phylogeny</article-title>. <source>BMC Plant Biol.</source> <volume>20</volume>, <fpage>406</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12870-020-02621-y</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>L.-X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Worth</surname> <given-names>J. R. P.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Cameron</surname> <given-names>K. M.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>The complete chloroplast genome of Chinese bayberry <italic>(Morella rubra</italic>, myricaceae): Implications for understanding the evolution of fagales</article-title>. <source>Front. Plant Sci.</source> <volume>8</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2017.00968</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marechal</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Brisson</surname> <given-names>N.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Recombination and the maintenance of plant organelle genome stability</article-title>. <source>New Phytol.</source> <volume>186</volume>, <fpage>299</fpage>&#x2013;<lpage>317</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1469-8137.2010.03195.x</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Martin</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Funk</surname> <given-names>H. T.</given-names>
</name>
<name>
<surname>Serrot</surname> <given-names>P. H.</given-names>
</name>
<name>
<surname>Poltnigg</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Sabater</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Functional characterization of the thylakoid ndh complex phosphorylation by site-directed mutations in the <italic>ndhF</italic> gene</article-title>. <source>Biochim. Biophys. Acta</source> <volume>1787</volume>, <fpage>920</fpage>&#x2013;<lpage>928</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.bbabio.2009.03.001</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mcdonald</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>W. C.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>H. D.</given-names>
</name>
<name>
<surname>Leu</surname> <given-names>J. Y.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Clusters of nucleotide substitutions and insertion/deletion mutations are associated with repeat sequences</article-title>. <source>PloS Biol.</source> <volume>9</volume>, <elocation-id>e1000622</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pbio.1000622</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moore</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>Soltis</surname> <given-names>P. S.</given-names>
</name>
<name>
<surname>Bell</surname> <given-names>C. D.</given-names>
</name>
<name>
<surname>Burleigh</surname> <given-names>J. G.</given-names>
</name>
<name>
<surname>Soltis</surname> <given-names>D. E.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Phylogenetic analysis of 83 plastid genes further resolves the early diversification of eudicots</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A</source> <volume>107</volume>, <fpage>4623</fpage>&#x2013;<lpage>4628</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.0907801107</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Morton</surname> <given-names>B. R.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>Selection on the codon bias of chloroplast and cyanelle genes in different plant and algal lineages</article-title>. <source>J. Mol. Evol.</source> <volume>46</volume>, <fpage>449</fpage>&#x2013;<lpage>459</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/PL00006325</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Murray</surname> <given-names>M. G.</given-names>
</name>
<name>
<surname>Thompson</surname> <given-names>W. F</given-names>
</name>
</person-group> (<year>1980</year>). <article-title>Rapid isolation of higher weight DNA</article-title>. <source>Nucleic Acids Res</source> <volume>8</volume>, <fpage>4321</fpage>&#x2013;<lpage>4325</lpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/8.19.4321</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Murray</surname> <given-names>E. E.</given-names>
</name>
<name>
<surname>Lotzer</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Eberle</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>1989</year>). <article-title>Codon usage in plant genes</article-title>. <source>Nucleic Acids Res.</source> <volume>17</volume>, <fpage>477</fpage>&#x2013;<lpage>498</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/17.2.477</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Palmer</surname> <given-names>J. D.</given-names>
</name>
</person-group> (<year>1985</year>). <article-title>Comparative organaization of chloroplast genomes</article-title>. <source>Annu. Rev. Genet.</source> <volume>19</volume>, <fpage>325</fpage>&#x2013;<lpage>354</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev.ge.19.120185.001545</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Potter</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Eriksson</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Evans</surname> <given-names>R. C.</given-names>
</name>
<name>
<surname>Oh</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Smedmark</surname> <given-names>J. E. E.</given-names>
</name>
<name>
<surname>Morgan</surname> <given-names>D. R.</given-names>
</name>
<etal/>
</person-group>. (<year>2007</year>). <article-title>Phylogeny and classification of rosaceae</article-title>. <source>Plant Syst. Evol.</source> <volume>266</volume>, <fpage>5</fpage>&#x2013;<lpage>43</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00606-007-0539-9</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ravi</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Khurana</surname> <given-names>J. P.</given-names>
</name>
<name>
<surname>Tyagi</surname> <given-names>A. K.</given-names>
</name>
<name>
<surname>Khurana</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>An update on chloroplast genomes</article-title>. <source>Plant Syst. Evol.</source> <volume>271</volume>, <fpage>101</fpage>&#x2013;<lpage>122</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00606-007-0608-0</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rozas</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Ferrer-Mata</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Sanchez-Delbarrio</surname> <given-names>J. C.</given-names>
</name>
<name>
<surname>Guirao-Rico</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Librado</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Ramos-Onsins</surname> <given-names>S. E.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>DnaSP 6: DNA sequence polymorphism analysis of Large data sets</article-title>. <source>Mol. Biol. Evol.</source> <volume>34</volume>, <fpage>3299</fpage>&#x2013;<lpage>3302</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msx248</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sevindik</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Murathan</surname> <given-names>Z. T.</given-names>
</name>
<name>
<surname>Sevindik</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Molecular genetic diversity of <italic>Prunus armeniaca</italic> l. (Rosaceae) genotypes by RAPD, ISSR-PCR, and chloroplast DNA (cpDNA) trnL-f sequences</article-title>. <source>Int. J. Fruit S.</source> <volume>20</volume>, <fpage>S1652</fpage>&#x2013;<lpage>S1661</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/15538362.2020.1828223</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sharp</surname> <given-names>P. M.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>W.-H.</given-names>
</name>
</person-group> (<year>1987</year>). <article-title>The codon adaptation index-a measure of directional synonymous codon usage bias, and its potential</article-title>. <source>Nucleic Acids Res.</source> <volume>15</volume>, <fpage>1281</fpage>&#x2013;<lpage>1295</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/15.3.1281</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shaw</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Small</surname> <given-names>R. L.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Addressing the "hardest puzzle in American pomology:" phylogeny of <italic>Prunus</italic> sect. prunocerasus (Rosaceae) based on seven noncoding chloroplast DNA regions</article-title>. <source>Am. J. Bot.</source> <volume>91</volume>, <fpage>985</fpage>&#x2013;<lpage>996</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3732/ajb.91.6.985</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sugiura</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>1992</year>). <article-title>The chloroplast genome</article-title>. <source>Plant Mol. Biol.</source> <volume>19</volume>, <fpage>149</fpage>&#x2013;<lpage>169</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/bf00015612</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Uchoi</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Malik</surname> <given-names>S. K.</given-names>
</name>
<name>
<surname>Choudhary</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Kumar</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Rohini</surname> <given-names>M. R.</given-names>
</name>
<name>
<surname>Pal</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>Inferring phylogenetic relationships of Indian citron (<italic>Citrus medica</italic> l.) based on <italic>rbc</italic>L and <italic>mat</italic>K sequences of chloroplast DNA</article-title>. <source>Biochem. Genet.</source> <volume>54</volume>, <fpage>249</fpage>&#x2013;<lpage>269</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10528-016-9716-2</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Shang</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Sa</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>The complete chloroplast genome of <italic>Prunus triloba</italic> var. <italic>plena</italic> and comparative analysis of <italic>Prunus</italic> species: genome structure, sequence divergence, and phylogenetic analysis</article-title>. <source>Braz. J. Bot.</source> <volume>44</volume>, <fpage>85</fpage>&#x2013;<lpage>95</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s40415-020-00685-6</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Kuang</surname> <given-names>R.-P.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X.-H.</given-names>
</name>
<name>
<surname>Liang</surname> <given-names>X.-L.</given-names>
</name>
<name>
<surname>Wanga</surname> <given-names>V. O.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>K.-M.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Complete chloroplast genome sequence of <italic>Fortunella venosa</italic> (Champ. ex benth.) C.C.Huang (Rutaceae): Comparative analysis, phylogenetic relationships, and robust support for its status as an independent species</article-title>. <source>Forests</source> <volume>12</volume>, <fpage>996</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/f12080996</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Han</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Identification of the complete chloroplast genome of <italic>Malus zhaojiaoensis</italic> jiang and its comparison and evolutionary analysis with other <italic>Malus</italic> species</article-title>. <source>Genes (Basel)</source> <volume>13</volume>, <fpage>560</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/genes13040560</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Yi</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Mu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Du</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Chromosome-level genome assembly of <italic>Cerasus humilis</italic> using PacBio and Hi-c technologies</article-title>. <source>Front. Genet.</source> <volume>11</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fgene.2020.00956</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Yu</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>KaKs_Calculator 2.0: A toolkit incorporating gamma-series methods and sliding window strategies</article-title>. <source>Genomics Proteomics Bioinf.</source> <volume>8</volume>, <fpage>77</fpage>&#x2013;<lpage>80</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/s1672-0229(10)60008-3</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Webster</surname> <given-names>A. D.</given-names>
</name>
<name>
<surname>Looney</surname> <given-names>N. E.</given-names>
</name>
</person-group> (<year>1996</year>). <source>CHERRIES: Crop physiology, production and uses</source> (<publisher-loc>Canbridge</publisher-loc>: <publisher-name>University Press</publisher-name>).</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wicke</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Schneeweiss</surname> <given-names>G. M.</given-names>
</name>
<name>
<surname>Depamphilis</surname> <given-names>C. W.</given-names>
</name>
<name>
<surname>M&#xfc;ller</surname> <given-names>K. F.</given-names>
</name>
<name>
<surname>Quandt</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>The evolution of the plastid chromosome in land plants: gene content, gene order, gene function</article-title>. <source>Plant Mol. Biol.</source> <volume>76</volume>, <fpage>273</fpage>&#x2013;<lpage>297</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11103-011-9762-4</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xue</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Geng</surname> <given-names>F. D.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J. J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>D. Q.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>L.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Divergence in the <italic>Aquilegia ecalcarata</italic> complex is correlated with geography and climate oscillations: Evidence from plastid genome data</article-title>. <source>Mol. Ecol.</source> <volume>30</volume>, <fpage>5796</fpage>&#x2013;<lpage>5813</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/mec.16151</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xue</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Shi</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Ni</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Iqbal</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Ni</surname> <given-names>Z.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Comparative analysis of the complete chloroplast genome among <italic>Prunus mume</italic>, <italic>P. armeniaca</italic>, and <italic>P. salicina</italic>
</article-title>. <source>Hortic. Res.</source> <volume>6</volume>, <fpage>89</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41438-019-0171-1</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Di</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Meng</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Phylogeography and evolution of two closely related oak species (<italic>Quercus</italic>) from north and northeast China</article-title>. <source>Tree Genet. Genom.</source> <volume>12</volume>, <fpage>89</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11295-016-1044-5</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Y&#xfc;</surname> <given-names>D. J.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>L. T.</given-names>
</name>
<name>
<surname>Ku</surname> <given-names>T. C.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>C. L.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>S. X.</given-names>
</name>
</person-group> (<year>1986</year>). <source>Flora of China</source> (<publisher-loc>Beijing</publisher-loc>: <publisher-name>Science Press</publisher-name>).</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zarei</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Erfani-Moghadam</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Mozaffari</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Phylogenetic analysis among some pome fruit trees of rosaceae family using RAPD markers</article-title>. <source>Biotechnol. Biotec. Eq.</source> <volume>31</volume>, <fpage>289</fpage>&#x2013;<lpage>298</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/13102818.2016.1276414</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Z. S.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Evolution of rosaceae plastomes highlights unique <italic>Cerasus</italic> diversification and independent origins of fruiting cherry</article-title>. <source>Front. Plant Sci.</source> <volume>12</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2021.736053</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Kanwal</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Bai</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Completion of eight <italic>Gynostemma</italic> BL. (Cucurbitaceae) chloroplast genomes: Characterization, comparative analysis, and phylogenetic relationships</article-title>. <source>Front. Plant Sci.</source> <volume>8</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2017.01583</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Ziling</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>The chloroplast genome of <italic>Prunus dielsiana</italic> (Rosaceae)</article-title>. <source>Mitochond. DNA B</source> <volume>4</volume>, <fpage>4033</fpage>&#x2013;<lpage>4034</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/23802359.2019.1688723</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>