<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2018.00324</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Sequencing and Analysis of <italic>Strobilanthes cusia</italic> (Nees) Kuntze Chloroplast Genome Revealed the Rare Simultaneous Contraction and Expansion of the Inverted Repeat Region in Angiosperm</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Chen</surname> <given-names>Haimei</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Shao</surname> <given-names>Junjie</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Hui</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/519049/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Jiang</surname> <given-names>Mei</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Huang</surname> <given-names>Linfang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/374429/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Zhao</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Yang</surname> <given-names>Dan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>He</surname> <given-names>Molly</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Ronaghi</surname> <given-names>Mostafa</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Luo</surname> <given-names>Xi</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Sun</surname> <given-names>Botao</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Wu</surname> <given-names>Wuwei</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/486600/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Liu</surname> <given-names>Chang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/369616/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Key Laboratory of Bioactive Substances and Resource Utilization of Chinese Herbal Medicine, Ministry of Education, Institute of Medicinal Plant Development, Chinese Academy of Medical Sciences and Peking Union Medical College</institution>, <addr-line>Beijing</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Illumina, Inc., San Diego</institution>, <addr-line>CA</addr-line>, <country>United States</country></aff>
<aff id="aff3"><sup>3</sup><institution>Guangxi Botanical Garden of Medicinal Plants</institution>, <addr-line>Nanning</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: <italic>TingFung Chan, The Chinese University of Hong Kong, Hong Kong</italic></p></fn>
<fn fn-type="edited-by"><p>Reviewed by: <italic>Ren&#x00E9; Massimiliano Marsano, Universit&#x00E0; degli Studi di Bari Aldo Moro, Italy; J&#x00E1;nos Taller, University of Pannonia, Hungary</italic></p></fn>
<fn fn-type="corresp" id="fn001"><p>&#x002A;Correspondence: <italic>Chang Liu, <email>cliu6688@yahoo.com</email>;, <email>cliu@implad.ac.cn</email></italic></p></fn>
<fn fn-type="other" id="fn002"><p><sup>&#x2020;</sup><italic>These authors have contributed equally to this work.</italic></p></fn>
<fn fn-type="other" id="fn003"><p>This article was submitted to Evolutionary and Population Genetics, a section of the journal Frontiers in Plant Science</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>14</day>
<month>03</month>
<year>2018</year>
</pub-date>
<pub-date pub-type="collection">
<year>2018</year>
</pub-date>
<volume>9</volume>
<elocation-id>324</elocation-id>
<history>
<date date-type="received">
<day>06</day>
<month>11</month>
<year>2017</year>
</date>
<date date-type="accepted">
<day>27</day>
<month>02</month>
<year>2018</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2018 Chen, Shao, Zhang, Jiang, Huang, Zhang, Yang, He, Ronaghi, Luo, Sun, Wu and Liu.</copyright-statement>
<copyright-year>2018</copyright-year>
<copyright-holder>Chen, Shao, Zhang, Jiang, Huang, Zhang, Yang, He, Ronaghi, Luo, Sun, Wu and Liu</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>Ban-Lan-Gen, the root tissues derived from several morphologically indistinguishable plant species, have been used widely in traditional Chinese medicines for numerous years. The identification of reliable markers to distinguish various source plant species is critical for the effective and safe use of products containing Ban-Lan-Gen. Here, we analyzed and characterized the complete chloroplast (cp) genome sequence of <italic>Strobilanthes cusia</italic> (Nees) Kuntze to identify high-resolution markers for the species determination of Southern Ban-Lan-Gen. Total DNA was extracted and subjected to next-generation sequencing. The cp genome was then assembled, and the gaps were filled using PCR amplification and Sanger sequencing. Genome annotation was conducted using CpGAVAS web server. The genome was 144,133 bp in length, presenting a typical quadripartite structure of large (LSC; 91,666 bp) and small (SSC; 17,328 bp) single-copy regions separated by a pair of inverted repeats (IRs; 17,811 bp). The genome encodes 113 unique genes, including 79 protein-coding, 30 transfer RNA, and 4 ribosomal RNA genes. A total of 20 tandem, 2 forward, and 6 palindromic repeats were detected in the genome. A phylogenetic analysis based on 65 protein-coding genes showed that <italic>S. cusia</italic> was closely related to <italic>Andrographis paniculata</italic> and <italic>Ruellia breedlovei</italic>, which belong to the same family, Acanthaceae. One interesting feature is that the IR regions apparently undergo simultaneous contraction and expansion, resulting in the presence of single copies of rps19, rpl2, rpl23, and ycf2 in the LSC region and the duplication of psbA and trnH genes in the IRs. This study provides the first complete cp genome in the genus <italic>Strobilanthes</italic>, containing critical information for the classification of various <italic>Strobilanthes</italic> species in the future. This study also provides the foundation for precisely determining the plant sources of Ban-Lan-Gen.</p>
</abstract>
<kwd-group>
<kwd>Ban-Lan</kwd>
<kwd>Ban-Lan-Gen</kwd>
<kwd><italic>Strobilanthes cusia</italic> (Nees) Kuntze</kwd>
<kwd><italic>Baphicacanthus cusia</italic> (Nees) Bremek</kwd>
<kwd>chloroplast genome</kwd>
</kwd-group>
<counts>
<fig-count count="5"/>
<table-count count="3"/>
<equation-count count="0"/>
<ref-count count="55"/>
<page-count count="13"/>
<word-count count="0"/>
</counts>
</article-meta>
</front>
<body>
<sec><title>Introduction</title>
<p>Ban-Lan-Gen, the root tissues of several morphologically indistinguishable plant species known as Ban-Lan, is used in various traditional Chinese medicine (TCM) products for the treatment of viral hepatitis, influenza, cold, pneumonia, inflammation, herpes, erysipelas, and snakebite (<xref ref-type="bibr" rid="B3">Chinese Pharmacopoeia Commission, 2015</xref>). Chemical components with diverse structures, including indole alkaloids, quinazolinone alkaloids, monoterpenes, triterpenes, flavonoids, sterols, anthraquinones, benzoxazinones, and lignans, are derived from the extracts of Ban-Lan-Gen (<xref ref-type="bibr" rid="B13">Honda and Tabata, 1979</xref>; <xref ref-type="bibr" rid="B42">Sun et al., 2008</xref>; <xref ref-type="bibr" rid="B12">Gu et al., 2014</xref>). Pharmacological studies indicate that these components exert antimicrobial, antiviral, anticancer (<xref ref-type="bibr" rid="B31">Merz et al., 2004</xref>; <xref ref-type="bibr" rid="B15">Ichimaru et al., 2015</xref>), and anti-inflammatory effects (<xref ref-type="bibr" rid="B33">Otsuka et al., 1988</xref>).</p>
<p>Similar to those of numerous TCMs, the exact identities of the source plants of Ban-Lan-Gen are usually not well defined. Since 1995, Pharmacopoeia of the People&#x2019;s Republic of China has defined <italic>Isatis indigotica</italic> Fort as the source plant of Northern Ban-Lan-Gen and <italic>Baphicacanthus cusia</italic> (Nees) Bremek as the source plant of Southern Ban-Lan-Gen. However, people still use other plants as source of Ban-Lan-Gen. For example, according to Flora of China<sup><xref ref-type="fn" rid="fn01">1</xref></sup>, species including <italic>Strobilanthes cusia</italic> (Nees) Kuntze, <italic>Strobilanthes balansae</italic> Lindau, <italic>Ruellia indigotica</italic> Fortune, <italic>Ruellia indigofera</italic> Griff<italic>., Goldfussia cusia</italic> Nees, <italic>Dipteracanthus calycinus</italic> Champion ex Bentham, <italic>Strobilanthes championii</italic> T. Anderson, and <italic>Strobilanthes flaccidifolia</italic> Nees are all considered the aliases of <italic>B. cusia</italic> (Nees) Bremek. Another study stated that &#x201C;Ban-Lan-Gen is the common name for the dried roots of indigo plants, including <italic>Polygonum tinctorium</italic>, <italic>Isatis indigotica</italic>, <italic>Isatis tinctoria</italic>, and <italic>Strobilanthes cusia</italic>.&#x201D; (<xref ref-type="bibr" rid="B19">Kumagai et al., 2016</xref>) The confusion regarding source plants with the common name &#x201C;Ban-Lan&#x201D; has undermined the consistent chemical compositions for medicinal products that use Ban-Lan as its source materials, leading to serious problems in the efficacy and safety of the medicinal products. Therefore, the identification of molecular markers that can unambiguously distinguish the plant materials is critical for ensuring the beneficial effects of medicinal products, including &#x201C;Ban-Lan.&#x201D;</p>
<p><italic>S. cusia</italic> (Nees) Kuntze, also known as <italic>B. cusia</italic> (Nees) Bremek and commonly called Ban-Lan, is a member of the family Acanthaceae. This herbaceous plant is considered as the typical species for Southern Ban-Lan-Gen (Chinese Pharmacopoeia) and native to northeast India, Myanmar, Thailand, and Southern China. The plant has been widely used as a dye and the source of traditional herbal medicines (<xref ref-type="bibr" rid="B51">Wu et al., 2006</xref>). Whereas its roots are commonly known as Ban-Lan-Gen and used as medicinal materials, the stems and leaves of <italic>S. cusia</italic> are used as the dye known as indigo blue (<xref ref-type="bibr" rid="B27">Liu et al., 2014</xref>). However, the species identity of <italic>S. cusia</italic> is not well defined. The genus <italic>Strobilanthes</italic> contains approximately 400 species; their morphological characters are highly homoplasious, causing difficulty in further classification and differentiation of various <italic>Strobilanthes</italic> species. The lacks of suitable samples and sufficient sampling have also hindered the usage of molecular markers for the phylogenetic classification of <italic>Strobilanthes</italic> species.</p>
<p>The chloroplast (cp) is an organelle that sustains life on earth by converting solar energy to carbohydrates through photosynthesis and oxygen release. The cp genome is ideal for ecological, evolutionary, and diversity studies due to several biological properties, such as high copy numbers of the genome compared with the nuclear genome, conserved genome structure, uniparental inheritance, and low effective population sizes (<xref ref-type="bibr" rid="B49">Wicke et al., 2011</xref>). Thus, the sequencing of plastid locus is instrumental in improving our understanding of phylogenetic relationships (<xref ref-type="bibr" rid="B16">Jansen et al., 2007</xref>), phylogeographic patterns (<xref ref-type="bibr" rid="B10">Golden and Bain, 2000</xref>), species discrimination (<xref ref-type="bibr" rid="B32">Nock et al., 2011</xref>), hybridization (<xref ref-type="bibr" rid="B34">Palme et al., 2004</xref>), photosynthesis (<xref ref-type="bibr" rid="B24">Leister, 2003</xref>), and genome evolution (<xref ref-type="bibr" rid="B49">Wicke et al., 2011</xref>, <xref ref-type="bibr" rid="B48">2016</xref>) for particular taxonomic groups. Although single-gene regions are the workhorse for molecular phylogenetic studies, the move from analysis of single-gene regions, which can be amplified by polymerase chain reaction (PCR), to complete cp genome is important to provide subspecies or variety-level resolution and address previously unanswered questions. The presence of hyper-variable sites suggests that sequences derived from cp genome can potentially be used to discriminate closely related species (<xref ref-type="bibr" rid="B23">Lei et al., 2016</xref>). As a result, obtaining the cp genome sequences of plant materials used for Ban-Lan-Gen can likely determine the exact species for the materials.</p>
<p>At present, more than one thousand cp genome sequences have been deposited at the National Center for Biotechnology Information (NCBI), including all of the major lineages of the plant kingdom. However, only two complete cp genomes of Acanthaceae, namely <italic>Andrographis paniculata</italic> and <italic>Ruellia breedlovei</italic>, have been sequenced. Moreover, no cp genome is available for species from the <italic>Strobilanthes</italic> genus. In this study, we sequenced and assembled the complete cp genome of <italic>S. cusia</italic> to identify molecular markers that can be used to classify <italic>S. cusia</italic> and its closely related species and to understand their phylogenetic relationships. The genome was then subjected to detailed analysis to identify genes and repeat elements. One interesting feature of the cp genome is that the inverted repeat (IR) regions showed simultaneous contraction and expansion, which is a rather rare observation in angiosperms. In summary, results obtained in this study provided valuable information to elucidate the evolutionary history of species in Acanthaceae. In addition, these results laid the foundation for the precise determination of plant species for the materials used in Ban-Lan-Gen.</p>
</sec>
<sec id="s1" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec><title>Plant Material and DNA Purification</title>
<p>Fresh leaves of <italic>S. cusia</italic> from multiple individuals were collected from Guangxi Medicinal Plant Garden, Nanning, Guangxi, China and stored at 4&#x00B0;C for cp DNA isolation. <italic>S. cusia</italic> is not an endangered or protected species, and no specific permissions were required for collection. A voucher specimen was deposited at the Institute of Medicinal Plant Development, Beijing, China. Total DNA was extracted using a plant genomic DNA kit (Tiangen Biotech, Beijing, Co., Ltd.). DNA purity was evaluated using 1.0% agarose gel, and DNA concentration was measured using a Nanodrop spectrophotometer 2000 (Thermo Fisher Scientific, United States).</p>
</sec>
<sec><title>Genome Sequencing, Assembly, and Annotation</title>
<p>Further steps of library preparation were performed using a TruSeq DNA Sample Prep Kit (Illumina, Inc., United States) according to the manufacturer&#x2019;s instructions. The DNA was sheared to yield approximately 500 bp-long fragments for paired-end library construction. The library was sequenced on Illumina HiSeq 3000 (Illumina Inc.). In total, 9,912,889 paired-end reads (2 &#x00D7; 150 bp) were obtained.</p>
<p>We first downloaded 1,006 plastid genomes from GenBank in February 2016. These plastid genome sequences were used to search against Illumina paired-end reads using BLASTN with an E-value cutoff of 1e-5. The genome sequence of <italic>A. paniculata</italic> (Accession number: <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="NC_022451">NC_022451</ext-link>) had the highest overall sequence similarity to the reads and was used as a reference for the downstream genome assembly.</p>
<p>AbySS (v1.5.2) (<xref ref-type="bibr" rid="B40">Simpson et al., 2009</xref>) and CLC Genomics Workbench (v7) was used for the <italic>de novo</italic> genome assembly. Using Gepard (<xref ref-type="bibr" rid="B17">Krumsiek et al., 2007</xref>), we identified 7 contigs from the assembly of contigs of AbySS and CLC Genomics Workbench, respectively, that nearly spanned the entire cp genome. All the 14 contigs were assembled using Seqman module of DNASTAR (v11.0). Then, we obtained only one sequence corresponding to the large single-copy (LSC), IR, and small single-copy (SSC) regions of <italic>S. cusia.</italic> Regions corresponding to the IR/SSC and IR/LSC boundaries were confirmed via direct PCR amplifications.</p>
<p>PCR amplifications were performed using the sequence-specific primers (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>) under the following conditions: pre-denaturation at 94&#x00B0;C for 2 min, 35 cycles of amplification at 94&#x00B0;C for 30 s, 55&#x00B0;C for 30 s, and 72&#x00B0;C for 30 s, followed by a final extension at 72&#x00B0;C for 2 min. The PCR reaction mixture contained 25 &#x03BC;L of Taq MasterMix (2 &#x00D7; ), 2 &#x03BC;L of forward primer (10 &#x03BC;M), 2 &#x03BC;L of reverse primer (10 &#x03BC;M), and purified cp DNA ( &#x003C; 1 &#x03BC;g). RNase-free water was added to a final reaction volume of 50 &#x03BC;L.</p>
<p>The CpGAVAS web service (<xref ref-type="bibr" rid="B26">Liu et al., 2012</xref>) was used to annotate the <italic>S. cusia</italic> cp genome. Cutoffs for the E-values of BLASTN and BLASTX were 1e-10. The number of top hits to be included in the reference gene sets for annotation after the pre-filtering step was 10. Meanwhile, tRNA genes were identified using tRNAscan-SE (<xref ref-type="bibr" rid="B29">Lowe and Eddy, 1997</xref>) and ARAGORN (<xref ref-type="bibr" rid="B21">Laslett and Canback, 2004</xref>). Manual corrections on the positions of the start and stop codons, and for the intron/exon boundaries were performed based on the entries in the cp genome database (<xref ref-type="bibr" rid="B5">Cui et al., 2006</xref>) using the Apollo program (<xref ref-type="bibr" rid="B22">Lee et al., 2009</xref>). Moreover, the circular cp genome map of <italic>S. cusia</italic> was drawn using OrganellarGenomeDRAW (<xref ref-type="bibr" rid="B28">Lohse et al., 2013</xref>). Furthermore, codon usage and GC content (that is, the percentage of Guanines and Cytosines) were analyzed using the Cusp and Compseq programs provided by EMBOSS (<xref ref-type="bibr" rid="B38">Rice et al., 2000</xref>). Final genome assembly and genome annotation results were deposited in the GenBank (accession number: <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="MG874806">MG874806</ext-link>).</p>
</sec>
<sec><title>Repeat Sequence Analysis</title>
<p>Simple sequence repeats (SSRs) were detected using MISA Perl Script available at <ext-link ext-link-type="uri" xlink:href="http://pgrc.ipk-gatersleben.de/misa/">http://pgrc.ipk-gatersleben.de/misa/</ext-link> with the following thresholds: 8 repeat units for mononucleotide SSRs, 4 repeat units for di- and trinucleotide repeat SSRs, and 3 repeat units for tetra-, penta-, and hexanucleotide repeat SSRs. Tandem repeats were analyzed using Tandem Repeats Finder (<xref ref-type="bibr" rid="B1">Benson, 1999</xref>) with parameter settings of two for matches and seven for mismatches and indels. The minimum alignment score and maximum period size were set at 50 and 500, respectively. All the identified repeats were manually verified and nested, or redundant results were removed. REPuter (<xref ref-type="bibr" rid="B20">Kurtz et al., 2001</xref>) was employed to identify the IRs in <italic>S. cusia</italic> by forward versus reverse complement (palindromic) alignment. The minimal repeat size was set at 30 bp, and the cutoff for similarities among the repeat units was set at 90%.</p>
</sec>
<sec><title>Comparative Genome Analysis</title>
<p>Conserved sequences were identified between the cp genomes of <italic>Astragalus membranaceus</italic> and those of <italic>A. paniculata</italic> (NC_022451.2), <italic>R. breedlovei</italic> (KP300014.1), <italic>Tanaecium tetragonolobum</italic> (NC_027955.1), <italic>Dorcoceras hygrometricum</italic> (NC_016468.1), <italic>Salvia miltiorrhiza</italic> (NC_020431.1), <italic>Olea europaea</italic> (NC_013707.2), <italic>Sesamum indicum</italic> (NC_016433.2), and <italic>Scrophularia takesimensis</italic> (NC_026202.1) by using BLASTN with an E-value cutoff of 1e-10. The homologous regions and gene annotations were visualized using a web-based genome synteny viewer GSV (<xref ref-type="bibr" rid="B37">Revanna et al., 2011</xref>).</p>
</sec>
<sec><title>Comparison of IR Boundaries in the Angiosperm Plant</title>
<p>A total of 31 species were examined for expansion or contraction of the IR, representing 29 species from Lamiales and 2 species from Actinidiaceae. The annotations of these cp genomes were downloaded from RefSeq database.</p>
</sec>
<sec><title>Phylogenetic Analysis</title>
<p>A total of 28 complete cp DNA sequences belonging to the Lamiales order were obtained from RefSeq database. For the phylogenetic analysis, 65 protein sequences were shared among all these 31 species, and <italic>S. cusia</italic> was aligned using the CLUSTALW2 (v2.0.12) program. The 65 proteins included ATPA, ATPB, ATPE, ATPF, ATPH, ATPI, CCSA, CEMA, MATK, NDHA, NDHB, NDHC, NDHE, NDHF, NDHG, NDHH, NDHI, NDHJ, NDHK, PETA, PETD, PETG, PETL, PETN, PSAA, PSAB, PSAC, PSAI, PSAJ, PSBA, PSBC, PSBD, PSBE, PSBF, PSBH, PSBJ, PSBK, PSBL, PSBM, PSBN, PSBT, PSBZ, RBCL, RPL14, RPL2, RPL20, RPL22, RPL23, RPL32, RPL33, RPL36, RPOB, RPOC1, RPOC2, RPS11, RPS14, RPS15, RPS18, RPS2, RPS3, RPS7, RPS8, YCF2, YCF3, and YCF4 (Supplementary File <xref ref-type="supplementary-material" rid="SM1">1</xref>). The alignment was manually examined and adjusted. Then, the evolutionary history was inferred using the Maximum Likelihood method implemented in RaxML (v8.2.4) (<xref ref-type="bibr" rid="B43">Stamatakis, 2015</xref>). The detailed parameters were &#x201C;raxmlHPC-PTHREADS-SSE3 -f a -N 1000 -m PROTGAMMACPREV -x 551314260 -p 551314260 -o A_thaliana, N_tabacum -T 20&#x201D;. The tree with the highest log likelihood (-126826.029496) was shown. The significance level for the phylogenetic tree was assessed by bootstrap testing with 1000 replications. The bootstrap values exceeding 50% were shown next to the corresponding nodes.</p>
</sec>
</sec>
<sec><title>Results</title>
<sec><title>General Features of the <italic>S. cusia</italic> Cp Genome</title>
<p>The complete plastid genome of <italic>S. cusia</italic> is a circular molecule of 144,133 bp in length. The genome possesses an LSC region of 91,666 bp, separated from the 17,811 bp SSC region by two IRs, each at 17,328 bp (<bold>Figure <xref ref-type="fig" rid="F1">1</xref></bold>). The genome was deposited in GenBank under accession number: <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="MG874806">MG874806</ext-link>. A total of 113 genes are contained within the <italic>S. cusia</italic> cp genome, including 79 protein-coding genes, 30 tRNA genes, and 4 RNA genes (<bold>Table <xref ref-type="table" rid="T1">1</xref></bold>). Five protein-coding and seven tRNA-coding genes are duplicated on the IR regions. The LSC region contains 64 protein-coding genes and 22 tRNA genes, whereas the SSC region contains 11 protein-coding genes and one tRNA gene. Fifteen and three genes in the <italic>S. cusia</italic> cp genome possess one and two introns, respectively. Compared with the genes of <italic>R. breedlovei</italic>, the two genes <italic>matk</italic> and <italic>ycf2</italic> are shorter at 453 and 663 bp, respectively, at the 5&#x2032;-end sequence. The sequences of <italic>ycf2</italic> and <italic>matk</italic> are confirmed via direct PCR amplifications and Sanger sequencing using the primers listed in Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Gene map of <italic>S. cusia</italic> cp genome. Genes inside and outside of the circle are transcribed in the clockwise and counterclockwise directions, respectively. LSC, large single-copy region; SSC small single-copy region; IR, inverted repeat.</p></caption>
<graphic xlink:href="fpls-09-00324-g001.tif"/>
</fig>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Genes contained in the <italic>S. cusia</italic> cp genome (a total of 113 genes).</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Category for genes</th>
<th valign="top" align="left">Group of genes</th>
<th valign="top" align="left">Name of genes</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Ribosome RNA genes</td>
<td valign="top" align="left">rRNA genes</td>
<td valign="top" align="left"><italic>rrn16</italic> (IR), <italic>rrn23</italic> (IR), <italic>rrn4.5</italic> (IR), <italic>rrn5</italic> (IR)</td>
</tr>
<tr>
<td valign="top" align="left">Transfer RNA genes</td>
<td valign="top" align="left">tRNA genes</td>
<td valign="top" align="left">37 genes (8 contain introns, 7 in the IR regions)</td>
</tr>
<tr>
<td valign="top" align="left">Protein-coding genes</td>
<td valign="top" align="left">Large subunit of ribosome</td>
<td valign="top" align="left"><italic>rpl2</italic><sup>&#x2217;</sup>, <italic>rpl14</italic>, <italic>rpl16</italic><sup>&#x2217;</sup>, <italic>rpl20</italic>, <italic>rpl22</italic>, <italic>rpl23</italic>, <italic>rpl32</italic>, <italic>rpl33</italic>, <italic>rpl36</italic></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">Small subunit of ribosome</td>
<td valign="top" align="left"><italic>rps2</italic>, <italic>rps3</italic>, <italic>rps4</italic>, <italic>rps7</italic> (IR), <italic>rps8</italic>, <italic>rps11</italic>, <italic>rps12</italic> (IR<sup>&#x2217;</sup>), <italic>rps14</italic>, <italic>rps15</italic>, <italic>rps16</italic><sup>&#x2217;</sup>,<italic>rps18</italic>, <italic>rps19</italic></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">DNA dependent RNA polymerase</td>
<td valign="top" align="left"><italic>rpoA</italic>, <italic>rpoB</italic>, <italic>rpoC1</italic><sup>&#x2217;</sup>, <italic>rpoC2</italic></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">Subunits of NADH-dehydrogenase</td>
<td valign="top" align="left"><italic>ndhA</italic><sup>&#x2217;</sup>, <italic>ndhB</italic><sup>&#x2217;</sup> (IR), <italic>ndhC</italic>, <italic>ndhD</italic>, <italic>ndhE</italic>, <italic>ndhF</italic>, <italic>ndhG</italic>, <italic>ndhH</italic>, <italic>ndhI</italic>, <italic>ndhJ</italic>, <italic>ndhK</italic></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">Subunits of cytochrome b/f complex</td>
<td valign="top" align="left"><italic>petA</italic>, <italic>petB</italic><sup>&#x2217;</sup>, <italic>petD</italic><sup>&#x2217;</sup>, <italic>petG</italic>, <italic>petL</italic>, <italic>petN</italic></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">Subunits of photosystem I</td>
<td valign="top" align="left"><italic>psaA</italic>, <italic>psaB</italic>, <italic>psaC</italic>, <italic>psaI</italic>, <italic>psaJ</italic>, <italic>ycf3</italic><sup>&#x2217;&#x2217;</sup></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">Subunits of photosystem II</td>
<td valign="top" align="left"><italic>psbA</italic> (IR), <italic>psbB</italic>, <italic>psbC</italic>, <italic>psbD</italic>, <italic>psbE</italic>, <italic>psbF</italic>, <italic>psbH</italic>, <italic>psbI</italic>, <italic>psbJ</italic>, <italic>psbK</italic>, <italic>psbL</italic>, <italic>psbM</italic>, <italic>psbN</italic>, <italic>psbT</italic>, <italic>psbZ</italic></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">Subunit of rubisco</td>
<td valign="top" align="left"><italic>rbcL</italic></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">Subunits of ATP synthase</td>
<td valign="top" align="left"><italic>atpA</italic>, <italic>atpB</italic>, <italic>atpE</italic>, <italic>atp</italic>F<sup>&#x2217;</sup>, <italic>atpH</italic>, <italic>atpI</italic></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">Subunit of Acetyl-CoA-carboxylase</td>
<td valign="top" align="left"><italic>accD</italic></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">c-type cytochrome synthesis gene</td>
<td valign="top" align="left"><italic>ccsA</italic></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">Envelop membrane protein</td>
<td valign="top" align="left"><italic>cemA</italic></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">Protease</td>
<td valign="top" align="left"><italic>clpP</italic><sup>&#x2217;&#x2217;</sup></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">Translational initiation factor</td>
<td valign="top" align="left"><italic>infA</italic></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">Maturase</td>
<td valign="top" align="left"><italic>matK</italic></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">Conserved open reading frames</td>
<td valign="top" align="left"><italic>ycf1</italic> (IR), <italic>ycf2</italic>, <italic>ycf4</italic></td>
</tr>
<tr>
<td valign="top" align="left"></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<attrib><italic><italic>Genes located on the IR regions are indicated by the (IR) symbol after the gene name. One and two asterisks after gene name reflect one and two introns contained in the gene, respectively. The rps12 transcript is trans-spliced.</italic></italic></attrib>
</table-wrap-foot>
</table-wrap>
<p>The overall GC content of the <italic>S. cusia</italic> cp genome is 38%. The GC content of the IR regions (46%) is higher than that of the LSC and SSC regions (37% and 32%). Overall, 49.4% of the <italic>S. cusia</italic> cp genome sequence is composed of genes that encode proteins. The overall GC content of the <italic>S. cusia</italic> cp genome is 38.38%, whereas that of the protein-coding regions is 38.00%. Within the protein-coding regions, the GC contents for the first, second, and third positions of codons are 46.17%, 38.51%, and 30.47%, respectively. The codon usage and codon-anticodon recognition patterns of the <italic>S. cusia</italic> cp genome are summarized in Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S2</xref>. The 30 tRNA genes contain codons corresponding to all 20 amino acids that are necessary for protein biosynthesis.</p>
</sec>
<sec><title>Repeat and SSR Analysis</title>
<p>Simple Sequence Repeats are valuable molecular markers of high-degree variations within the same species; these markers have been used in population genetics and polymorphism investigations (<xref ref-type="bibr" rid="B54">Xue et al., 2012</xref>). We analyzed the occurrence, type, and distribution of SSRs in the <italic>S. cusia</italic> cp genome. In total, 160 SSRs were identified in <italic>S. cusia</italic> cp genome by using the software tool MISA (<bold>Table <xref ref-type="table" rid="T2">2</xref></bold>). Among these SSRs, the majority consisted of mono- and dinucleotide repeats, which were found 94 and 43 times, respectively. By contrast, tri- (10), tetra- (11), and pentanucleotide repeat sequences (2) were observed with lower frequency. Most mononucleotide repeat sequences consisted of A/T repeats (92.6%). Similarly, 55.8% of the dinucleotide repeat sequences consisted of AT/AT repeats (<bold>Table <xref ref-type="table" rid="T2">2</xref></bold>). These results are in agreement with the previous findings stating that the cp SSRs are generally composed of short poly-A or poly-T repeats and rarely contained tandem G or C repeats (<xref ref-type="bibr" rid="B18">Kuang et al., 2011</xref>).</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Numbers of SSRs identified in the cp genome of <italic>S. cusia.</italic></p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">SSR Repeat Type (Number of copies)</th>
<th valign="top" align="left">SSR Repeat Sequences</th>
<th valign="top" align="center" colspan="9">Number of Copies</th>
<th valign="top" align="center">Total</th>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left"></td>
<td valign="top" align="left" colspan="9"><hr/></td>
<td valign="top" align="left"></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left"></td>
<th valign="top" align="center">3</th>
<th valign="top" align="center">4</th>
<th valign="top" align="center">5</th>
<th valign="top" align="center">6</th>
<th valign="top" align="center">7</th>
<th valign="top" align="center">8</th>
<th valign="top" align="center">9</th>
<th valign="top" align="center">10</th>
<th valign="top" align="center">11</th>
<td valign="top" align="center"></td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Mono-nucleotide (94)</td>
<td valign="top" align="left">A/T</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">45</td>
<td valign="top" align="center">28</td>
<td valign="top" align="center">11</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">87</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">C/G</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center"></td>
<td valign="top" align="center">7</td>
</tr>
<tr>
<td valign="top" align="left">Di-nucleotide (43)</td>
<td valign="top" align="left">AC/GT</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">AG/CT</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">15</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center">15</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">AT/AT</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">16</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center">24</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">CG/CG</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">Tri-nucleotide (10)</td>
<td valign="top" align="left">AAG/CTT</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">AAT/ATT</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center">9</td>
</tr>
<tr>
<td valign="top" align="left">Tetra-nucleotide (11)</td>
<td valign="top" align="left">AAAG/CTTT</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">AAAT/ATTT</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">AACT/AGTT</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">AATC/ATTG</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">AATG/ATTC</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left">AATT/AATT</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center">4</td>
</tr>
<tr>
<td valign="top" align="left">Penta-nucleotide (2)</td>
<td valign="top" align="left">AAAAT/ATTTT</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left"></td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The locations of SSRs in the cp genome are shown in Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S3</xref>. The corresponding locations were further classified as intergenic (IGS), exonic, and intronic regions. Several SSRs that were separated with distances less than 100 bp were considered together as a compound SSR. In total, 21 compound SSRs were identified. In terms of the distribution, 64, 46, and 18 repeats were located in the IGS, exon, and intron regions, respectively. In particular, two of them spanned over the IGS and CDS regions (repeats no. 51 and 101, Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S3</xref>).</p>
<p>By definition, SSRs possess a repeat unit size equal to or less than five. We analyzed repeats with unit sizes exceeding five by using software tool Tandem Repeats Finder and REPuter. The repeats were divided into two types: tandem repeats and dispersed repeats. Tandem repeats are defined as those with two or more adjacent, approximate copies of a pattern of nucleotides. In total, 20 tandem repeats with repeat unit size longer than 12 bp (included) were identified, with the overall percentage of similarities between the adjacent repeat units set to 60% (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S4</xref>). The repeat unit was enclosed with parentheses. Among them, 4, 14, and 2 repeats were located in the CDS, intergenic, and intron regions, respectively. In contrast to tandem repeats, dispersed repeats is defined as with two or more approximate copies of a pattern of nucleotides separated by a certain number of nucleotides. Dispersed repeats can be further divided into four types, namely, forward, reverse, complement, and palindromic repeats (<xref ref-type="bibr" rid="B20">Kurtz et al., 2001</xref>). In total, two forward repeats and six palindromic repeats were identified using REPuter with a total length cutoff of 30 bp (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S5</xref>). For the palindromic repeat, the complementary structures were shown using pairing parentheses. This large set of repeats provides a rich resource for the development of novel molecular markers and to understand the genome evolution in <italic>S. cusia</italic>.</p>
</sec>
<sec><title>Genes With Introns</title>
<p>Analysis of the genome revealed a total of 18 genes with introns (<bold>Table <xref ref-type="table" rid="T3">3</xref></bold>). Among the genes, the <italic>rps12</italic> is a trans-spliced gene; its 5&#x2032; end is located on the LSC region, and the 3&#x2032; end is located on the IR region. Two other genes, <italic>clpP</italic> and <italic>ycf3</italic>, presented two introns and three exons each. Nine genes, namely, <italic>atpF</italic>, <italic>ndhA</italic>, <italic>ndhB</italic>, <italic>petB</italic>, <italic>petD</italic>, <italic>rpl16</italic>, <italic>rpl2</italic>, <italic>rpoC1</italic>, and <italic>rps16</italic>, each with one intron, were identified. Finally, six tRNA genes with one intron and two exons each, namely, <italic>trnA</italic>-UGC, <italic>trnC</italic>-ACA, <italic>trnI</italic>-GAU, <italic>trnK</italic>-UUU, <italic>trnL</italic>-UAA, and <italic>trnS</italic>-CGA, were observed. The lengths of these introns range from 476 bp to 2391 bp, with the longest intron found in the <italic>trnK</italic>-UUU gene.</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>Length of intron and exon splitting genes in the <italic>S. cusia</italic> cp genome.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Gene</th>
<th valign="top" align="center" colspan="5">Length (bp)</th>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left" colspan="5"><hr/></td>
</tr>
<tr>
<td valign="top" align="left"></td>
<th valign="top" align="center">Exon I</th>
<th valign="top" align="center">Intron I</th>
<th valign="top" align="center">Exon II</th>
<th valign="top" align="center">Intron II</th>
<th valign="top" align="center">Exon III</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left"><italic>rps12<sup>&#x2217;</sup></italic></td>
<td valign="top" align="center">114</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">230</td>
<td valign="top" align="center">536</td>
<td valign="top" align="center">26</td>
</tr>
<tr>
<td valign="top" align="left"><italic>clpP</italic></td>
<td valign="top" align="center">71</td>
<td valign="top" align="center">736</td>
<td valign="top" align="center">297</td>
<td valign="top" align="center">605</td>
<td valign="top" align="center">229</td>
</tr>
<tr>
<td valign="top" align="left"><italic>ycf3</italic></td>
<td valign="top" align="center">124</td>
<td valign="top" align="center">722</td>
<td valign="top" align="center">230</td>
<td valign="top" align="center">703</td>
<td valign="top" align="center">153</td>
</tr>
<tr>
<td valign="top" align="left"><italic>atpF</italic></td>
<td valign="top" align="center">141</td>
<td valign="top" align="center">700</td>
<td valign="top" align="center">471</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic>ndhA</italic></td>
<td valign="top" align="center">553</td>
<td valign="top" align="center">1092</td>
<td valign="top" align="center">539</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic>ndhB</italic></td>
<td valign="top" align="center">870</td>
<td valign="top" align="center">586</td>
<td valign="top" align="center">756</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic>petB</italic></td>
<td valign="top" align="center">6</td>
<td valign="top" align="center">731</td>
<td valign="top" align="center">648</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic>petD</italic></td>
<td valign="top" align="center">8</td>
<td valign="top" align="center">672</td>
<td valign="top" align="center">526</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic>rpl16</italic></td>
<td valign="top" align="center">9</td>
<td valign="top" align="center">888</td>
<td valign="top" align="center">402</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic>rpl2</italic></td>
<td valign="top" align="center">391</td>
<td valign="top" align="center">644</td>
<td valign="top" align="center">470</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic>rpoC1</italic></td>
<td valign="top" align="center">432</td>
<td valign="top" align="center">847</td>
<td valign="top" align="center">1620</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic>rps16</italic></td>
<td valign="top" align="center">40</td>
<td valign="top" align="center">882</td>
<td valign="top" align="center">227</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic>trnA-</italic>UGC</td>
<td valign="top" align="center">38</td>
<td valign="top" align="center">806</td>
<td valign="top" align="center">35</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic>trnC-</italic>ACA</td>
<td valign="top" align="center">39</td>
<td valign="top" align="center">575</td>
<td valign="top" align="center">55</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic>trnI-</italic>GAU</td>
<td valign="top" align="center">37</td>
<td valign="top" align="center">917</td>
<td valign="top" align="center">56</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic>trnK-</italic>UUU</td>
<td valign="top" align="center">38</td>
<td valign="top" align="center">2391</td>
<td valign="top" align="center">35</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic>trnL-</italic>UAA</td>
<td valign="top" align="center">36</td>
<td valign="top" align="center">476</td>
<td valign="top" align="center">49</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"><italic>trnS-</italic>CGA</td>
<td valign="top" align="center">33</td>
<td valign="top" align="center">685</td>
<td valign="top" align="center">60</td>
<td valign="top" align="center"></td>
<td valign="top" align="center"></td>
</tr>
<tr>
<td valign="top" align="left"></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<attrib><italic><italic><sup>&#x2217;</sup>trans-spliced gene.</italic></italic></attrib>
</table-wrap-foot>
</table-wrap>
</sec>
<sec><title>Gene Loss</title>
<p>The loss of genes in cp genomes may result from the transfer of genes into the nuclear genome or the deletion of genes. To understand which genes may become indispensable during evolution, we performed hierarchical clustering of lost genes by using Ward&#x2019;s method among 29 species in the Lamiales order (<bold>Figure <xref ref-type="fig" rid="F2">2</xref></bold>). As shown in <bold>Figure <xref ref-type="fig" rid="F2">2</xref></bold>, a total of 15 genes that have lost one gene in at least one species are clustered into five groups. The first group includes genes <italic>accD</italic> and <italic>ycf15</italic>, which are lost in three and two species, respectively. Genes <italic>psbB</italic> and <italic>ycf1</italic>, which are lost in <italic>R. breedlovei</italic>, are included in the second group. Genes <italic>psbI</italic> and <italic>rps19</italic>, which are lost in <italic>D. hygrometricum</italic>, are included in the third group. Genes <italic>rps12</italic> and <italic>infA</italic>, which are included in the fourth group, are lost in five species, including <italic>Hesperelaea palmeri</italic>, three <italic>O. europaea</italic> subsp. <italic>maroccana</italic>, and <italic>Olea woodiana</italic>. The last group includes seven genes, namely, <italic>clpP</italic>, <italic>ndhD</italic>, <italic>petB</italic>, <italic>rpl16</italic>, <italic>rpoA</italic>, <italic>rps16</italic>, and <italic>rps4</italic>, which are all lost in <italic>T. tetragonolobum.</italic> In <italic>S. cusia</italic>, only the <italic>ycf15</italic> gene is lost, indicating that the gene loss rate in <italic>S. cusia</italic> is lower than those in other species. The <italic>ycf15</italic> gene belongs to the PFAM protein family PF10705, in which its function remains unknown. In certain plant species, the <italic>ycf15</italic> gene is probably not a protein-coding gene because the proteins in these species possess premature stop codons (<xref ref-type="bibr" rid="B44">Steane, 2005</xref>). The loss of <italic>ycf15</italic> gene results in further undermining of the notion that <italic>ycf15</italic> plays important functions in the genome of <italic>S. cusia</italic>.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Gene losses in the cp genomes of the Lamiales order.</p></caption>
<graphic xlink:href="fpls-09-00324-g002.tif"/>
</fig>
</sec>
<sec><title>Comparative Analysis of the Cp Genome Rearrangement</title>
<p>To identify the possible occurrence of genome rearrangement, we selected the cp genome sequences of <italic>S. cusia</italic> and eight other species belonging to Lamiales for synteny analyses. These eight species included <italic>A. paniculata</italic>, <italic>R. breedlovei</italic>, <italic>T. tetragonolobum</italic>, <italic>D. hygrometricum</italic>, <italic>S. miltiorrhiza</italic>, <italic>O. europaea</italic>, <italic>S. indicum</italic>, and <italic>S. takesimensis</italic>, which are members of the Acanthaceae, Bignoniaceae, Gesneriaceae, Lamiaceae, Oleaceae, Pedaliaceae, and Scrophulariaceae families, respectively (<bold>Figure <xref ref-type="fig" rid="F3">3</xref></bold>). Members of the Orobanchaceae and Lentibulariaceae families were not included. Orobanchaceae are parasites; without chlorophyll, their cp genomes are considerably reduced both in size and gene content and suffer horizontal gene transfer from its host, gene loss, and gene pseudogenization (<xref ref-type="bibr" rid="B25">Li et al., 2013</xref>). An exclusive combination of losses and pseudogenization of the plastid NAD(P)H-dehydrogenase (<italic>ndh</italic>) gene complex was observed in the cp genome of the Lentibulariaceae family (<xref ref-type="bibr" rid="B39">Silva et al., 2016</xref>). Therefore, we did not discuss the species belonging to family Lentibulariaceae and Orobanchaceae in the phylogenetic analysis and IR contraction/extension analysis part. Pairwise cp genome comparison between <italic>S. cusia</italic> and the other eight cp genomes recovered a high degree of synteny (<bold>Figure <xref ref-type="fig" rid="F3">3</xref></bold>). However, the <italic>S. cusia</italic> cp genome exhibits two unique features: first, the genes of <italic>psbA</italic> and <italic>trnH-</italic>GUG are duplicated in the <italic>S. cusia</italic> cp genome, which are located near the boundaries of the IRa-LSC, and IRb-LSC regions; second, the IR sequence of <italic>S. cusia</italic> is 17,328 bp in length, which is significantly shorter than those of <italic>A. paniculata</italic> (25,340 bp) and <italic>R. breedlovei</italic> (22,704 bp).</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>Comparative genomic analyses of <italic>S. cusia</italic> and eight other representative species of Lamiales. The cp genome of <italic>S. cusia</italic> was aligned with those of eight species. Each horizontal black line represents one genome. The species names are shown to the right of the corresponding line. The conserved regions are bridged by lines.</p></caption>
<graphic xlink:href="fpls-09-00324-g003.tif"/>
</fig>
</sec>
<sec><title>Phylogenetic Analysis of <italic>S. cusia</italic> Based on Conserved Protein Sequences</title>
<p>By far, only two cp genomes have been completely sequenced for species from Acanthaceae, a family under the order Lamiales. To determine the phylogenetic position of <italic>S. cusia</italic> in Lamiales, we obtained 29 complete cp genome sequences belonging to the Lamiales from the RefSeq database (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S6</xref>). The distributions of the 29 species among different families are as follows: Lamiaceae (16), Bignoniaceae (1), Acanthaceae (3), Gesneriaceae (1), Oleaceae (6), Pedaliaceae (1), and Scrophulariaceae (1), with the number shown in the enclosed parentheses representing the number of species in the corresponding clade. We extracted 65 protein sequences present among the 29 cp genomes and those of <italic>Nicotiana tabacum</italic> and <italic>Arabidopsis thaliana</italic>, which served as the outgroup taxa. Multiple sequence alignment of the amino acid sequences resulted in a total of 19,277 positions in the final dataset. The phylogenetic tree was constructed using the Maximum Likelihood method and is shown in <bold>Figure <xref ref-type="fig" rid="F4">4</xref></bold>. The closest sister species of <italic>S. cusia</italic> are <italic>R. breedlovei</italic> and <italic>A. paniculata</italic> in Acanthaceae, (bootstrap values: 100%), and this finding was consistent with the expected relationships.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>Molecular phylogenetic analyses of cp genomes in the Lamiales order. The tree was constructed with the sequences of 65 proteins present in 31 species (<italic>A. paniculata</italic>, <italic>R. breedlovei</italic>, <italic>T. tetragonolobum</italic>, <italic>D. hygrometricum</italic>, <italic>H. haplostachya</italic>, <italic>L. angustifolia</italic>, <italic>Phyllostegia velutina</italic>, <italic>Premna microphylla</italic>, <italic>R. officinalis</italic>, <italic>S. miltiorrhiza</italic>, <italic>S. baicalensis</italic>, <italic>S. insignis</italic>, <italic>S. byzantina</italic>, <italic>S. chamissonis</italic>, <italic>S. coccinea</italic>, <italic>S. sylvatica</italic>, <italic>S. bifida</italic>, <italic>S. haliakalae</italic>, <italic>S. kanehoana</italic>, <italic>T. grandis</italic>, <italic>H. palmeri</italic>, J. <italic>nudiflorum</italic>, <italic>O. europaea</italic>, <italic>O. europaea</italic> subsp. Cuspidata, <italic>O. europaea</italic> subsp. Maroccana, <italic>O. woodiana</italic> subsp. <italic>woodiana</italic>, <italic>S. indicum</italic>, <italic>S. takesimensis</italic>, <italic>Strobilanthes cusia</italic>, <italic>A. thaliana</italic>, and <italic>N. tabacum</italic>) using the Maximum Likelihood method implemented in RAxML. Two taxa, <italic>N. tabacum</italic> and <italic>A. thaliana</italic>, were used as outgroups. Tribes to which each species belongs are shown to the right side of the tree. Bootstrap supports were calculated from 1000 replicates.</p></caption>
<graphic xlink:href="fpls-09-00324-g004.tif"/>
</fig>
</sec>
<sec><title>IR Contraction/Extension Analysis of the Angiosperms</title>
<p>One distinct feature of the <italic>S. cusia</italic> cp genome is its IR length of 17,328 bp, which is significantly shorter than those of most angiosperms [ca. 20&#x2013;28 kb, (<xref ref-type="bibr" rid="B4">Chumley et al., 2006</xref>)]. The shortening of the IR region suggests the occurrence of an IR contraction event. By contrast, the IRs of <italic>S. cusia</italic> spanned to include the <italic>trnH</italic> and <italic>psbA</italic> genes, indicating the occurrence of another IR expansion event. To identify any potential evolutionary events, we analyzed the gene contents at the border areas in detail. The regions around the IR-LSC and IR-SSC borders extending from all the available cp genomes in Lamiales were analyzed, except those from the family Lentibulariaceae (the bladderwort family) and Orobanchaceae (a family of parasitic plants) (<bold>Figure <xref ref-type="fig" rid="F5">5A</xref></bold>). <italic>S. cusia</italic> is the only species in the Lamiales with an SSC region containing two copies of the <italic>trn</italic>H genes and two partial <italic>psb</italic>A genes. To determine the uniqueness of this pattern, we searched the SSC regions of all cp genomes and identified three species, <italic>Coriandrum sativum</italic>, <italic>Actinidia deliciosa</italic>, and <italic>Actinidia chinensis</italic>, whose SSC regions contain two copies of the <italic>trn</italic>H and <italic>psbA</italic> genes (<bold>Figure <xref ref-type="fig" rid="F5">5B</xref></bold>).</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>Comparison of IR contents <bold>(A)</bold> between <italic>S. cusia</italic> and several representative cp genomes from Lamiales and <bold>(B)</bold> between <italic>S. cusia</italic> and three non-Lamiales cp genomes. The ancestral angiosperm IR regions are shown in square.</p></caption>
<graphic xlink:href="fpls-09-00324-g005.tif"/>
</fig>
<p>The genes at the IR/SSC regions are rather conserved (<bold>Figure <xref ref-type="fig" rid="F5">5</xref></bold>), given that <italic>ndhF</italic> (not shown in the alignment) and <italic>ycf1</italic> genes are found in the SSC regions near the borders in almost all examined cp genomes examined; both genes appeared on the left side of the alignment in <bold>Figures <xref ref-type="fig" rid="F5">5A,B</xref></bold>. By contrast, various patterns of expansion and contraction of the IR regions into or from the LSC regions were observed, as shown on the right side of the alignment in <bold>Figures <xref ref-type="fig" rid="F5">5A,B</xref></bold>.</p>
<p>LSC/IR regions can be divided into four different types based on the patterns for the 29 cp genomes (<bold>Figure <xref ref-type="fig" rid="F5">5A</xref></bold>) belonging to the Lamiales. Type I, the most dominant pattern, is found in 22 species, including <italic>D. hygrometricum</italic>, <italic>T. tetragonolobum</italic>, <italic>S. takesimensis</italic>, <italic>A. paniculata</italic>, <italic>Scutellaria insignis</italic>, <italic>Stenogyne kanehoana</italic>, <italic>Stenogyne haliakalae</italic>, <italic>Stenogyne bifida</italic>, <italic>Phyllostegia velutina</italic>, <italic>Haplostachys haplostachya</italic>, <italic>Stachys chamissonis</italic>, <italic>Stachys byzantina</italic>, <italic>Stachys coccinea</italic>, <italic>Stachys sylvatica</italic>, <italic>Premna microphylla</italic>, <italic>Tectona grandis</italic>, <italic>Jasminum nudiflorum</italic>, <italic>H. palmeri</italic>, <italic>O. woodiana</italic> subsp. <italic>woodiana</italic>, <italic>O. europaea</italic>, <italic>O. europaea</italic> subsp. <italic>maroccana</italic>, and <italic>O. europaea</italic> subsp. <italic>cuspidate</italic>. For this type, the genes included <italic>rpl2</italic>, <italic>rpl23</italic>, <italic>trnI</italic>, <italic>ycf2, trnL, ndhB</italic>, <italic>rps7</italic>, <italic>3-rps12</italic>, <italic>trnV</italic>, <italic>rrn16</italic>, <italic>trnI</italic>, <italic>trnA</italic>, <italic>rrn23</italic>, <italic>rrn4.5</italic>, <italic>rrn5</italic>, <italic>trnR</italic>, <italic>trnN</italic>, and <italic>ycf1</italic> (pseudogene), which are duplicated in the IR regions, except for <italic>rps19</italic>. The LSC/IR border patterns of <italic>O. woodiana</italic> subsp. <italic>woodiana</italic>, <italic>O. europaea</italic> subsp. <italic>maroccana</italic>, and <italic>O. europaea</italic> subsp. <italic>cuspidata</italic> are the same as that of <italic>O. europaea</italic>. As a result, their structures of the LSC/IR regions are not shown in <bold>Figure <xref ref-type="fig" rid="F5">5A</xref></bold>.</p>
<p>The Type II pattern is found in five species, including <italic>Scutellaria baicalensis</italic>, <italic>S. miltiorrhiza</italic>, <italic>Rosmarinus officinalis</italic>, <italic>Lavandula angustifolia</italic>, and <italic>S. indicum</italic>. This pattern shows an <italic>rps19</italic> pseudogene at the IR/LSC border. Meanwhile, Type III pattern is only found in <italic>R. breedlovei</italic>, in which the <italic>rps19, rpl2</italic>, and <italic>rpl22</italic> are not found in the IR region, and an <italic>ycf2</italic> pseudogene is found at the IR/LSC border.</p>
<p>Type IV is found only in the <italic>S. cusia</italic> cp genome. On the one hand, the genes of <italic>rps19</italic>, <italic>rpl2</italic>, <italic>rpl23</italic>, and <italic>ycf2</italic> are found in the IRs. On the other hand, the IR extends into the LSC regions to include a <italic>trnH</italic> gene and a truncated <italic>psbA</italic> pseudogene at the IR/LSC border. A similar pattern has been observed in several species other than Lamiales (<bold>Figure <xref ref-type="fig" rid="F5">5B</xref></bold>). For example, in the cp genomes of <italic>C. sativum</italic> and <italic>A. chinensis</italic>, the IR region extends into the <italic>psbA</italic> gene and engulfs a fragment of the <italic>psb</italic>A gene at the IR/LSC border. However, these patterns slightly vary. In the cp genome of <italic>C. sativum</italic>, a serial of genes, including <italic>rps19</italic>, <italic>rpl2</italic>, <italic>rpl23</italic>, <italic>ycf2</italic>, <italic>ndhB</italic>, <italic>rps7</italic>, and <italic>3-rps12</italic>, are excluded from the IR regions. Meanwhile, in <italic>A. chinensis</italic>, the IR-LSC border expanded to the <italic>ycf2</italic> gene. Compared with the cp genome of other Lamiales, the loss of genes <italic>rpl2</italic>, <italic>rpl23</italic>, and <italic>ycf2</italic> in the IR regions may be responsible for the considerably shortened length of <italic>S. cusia</italic> cp genome. The various patterns of the IR/LSC border reflect the highly dynamic nature of the IR/LSC border regions.</p>
</sec>
</sec>
<sec><title>Discussion</title>
<p>We carried out a detailed study of the cp genome of <italic>S. cusia</italic>. In particular, we (1) sequenced the total DNA from the leaves of <italic>S. cusia</italic>, (2) filtered the reads that are similar to cp genome of other species, (3) assembled the genome followed by gap-filling to obtain the complete cp genome, (4) annotated the genome to identify protein-coding genes, rRNAs, and tRNAs, (5) analyzed the repeat sequences, (6) identified multiple SSR sequences, (7) characterized the boundary of the IR regions, and (8) conducted phylogenetic analyses of <italic>S. cusia</italic> and several closely related species. The present study provides high-quality reference sequences that can be used to precisely determine the varieties of <italic>S. cusia</italic>.</p>
<p>With the widespread adoption of next-generation DNA sequencing technology and bioinformatics software tools, complete plastid genome sequencing becomes possible with the genome skimming approach (<xref ref-type="bibr" rid="B45">Twyford and Ness, 2016</xref>). In the current study and several of our previous studies (<xref ref-type="bibr" rid="B2">Chen et al., 2014</xref>; <xref ref-type="bibr" rid="B46">Wang et al., 2016</xref>), the use of Illumina and PacBio technologies can lead to the assembly of the complete cp genome without the tedious isolation of plastids to separate cp DNA from nuclear DNAs. However, the polyploidy nature of the plastid genome makes the heteroplasmic variations almost a rule rather than exception (<xref ref-type="bibr" rid="B23">Lei et al., 2016</xref>). Thus, the genome sequence reported here only represents the most predominant types, and the diversities among the various cp genomes may have been neglected. One future challenge is to accurately characterize the variations in plastid genomes to understand the evolution of thousands of copies of plastid genome within a particular cell, within an individual, or within a particular species.</p>
<p>Ban-Lan-Gen is considered a common name for the dried roots of indigo plants; among them, <italic>I. indigotica</italic> Fort and <italic>B. cusia</italic> (Nees) Bremek are the most frequently used plants. Pharmacological studies have confirmed the anti-inflammatory and anti-viral effects of Ban-Lan-Gen for the treatment of hepatitis, influenza, and various kinds of inflammation (<xref ref-type="bibr" rid="B42">Sun et al., 2008</xref>; <xref ref-type="bibr" rid="B12">Gu et al., 2014</xref>). Studies on the chemical components have identified several biologically active ingredients in Ban-Lan-Gen, including indigoid alkaloids (such as indigo and indirubin) and quinazolinone alkaloids (such as tryptanthrin) (<xref ref-type="bibr" rid="B15">Ichimaru et al., 2015</xref>). Indigo, indirubin, and tryptanthrin are three marker compounds found in Ban-Lan-Gen (<xref ref-type="bibr" rid="B31">Merz et al., 2004</xref>), and both <italic>I. indigotica</italic> Fort and <italic>B. cusia</italic> (Nees) Bremek contain these compounds. Meanwhile, indirubin causes the transactivation of cytochrome P450 1A1 (CYP1A1) and CYP1A2 genes via the aryl hydrocarbon receptor (<xref ref-type="bibr" rid="B33">Otsuka et al., 1988</xref>). These studies have demonstrated the effectiveness of Ban-Lan-Gen in the treatment of various diseases and presented concerns whether the biological components from various plant materials are identical. For ensuring consistent results from investigations and the efficacy and effective usage of any medicinal product with Ban-Lan-Gen as their source materials, the exact identity of the plant material should be determined. We carried out the sequencing and analysis of the complete genome of <italic>S. cusia</italic> to solve this problem.</p>
<p>The cp genome of <italic>S. cusia</italic> is the first cp genome in the genera <italic>Strobilanthes</italic> (Strobilanthinae sensu Bremekamp). Roughly 400 species were recorded in tropical Asia. Specifically, 128 species, including 57 endemic ones, were discovered in China (<xref ref-type="bibr" rid="B9">Flora of China Editorial Committee, 2011</xref>). Species belonging to this genera display significant high levels of homoplasy in morphological characters, thereby causing marked difficulty in subdividing the genus. By contrast, molecular studies do not improve the situation because of insufficient sampling. Even the available samples appear to be challenging because numerous species are known only from the type of collection or from materials that are inadequate for molecular study. Taking these results together, we find that although the clusters of related species are clearly discernible, sufficient information is currently unavailable to produce a satisfactory intra-generic classification. As a result, the acquisition of the first cp genome opens up the avenue for molecular classification of species in the genera.</p>
<p>As a proof of concept exercise, we designed a set of 1563 primers using the program ecoPrimer<sup><xref ref-type="fn" rid="fn02">2</xref></sup>. They were identified using the following parameters: &#x201C;-l 299 -L 301 -e 0 -t species&#x201D; and the detailed results are shown in Supplementary File <xref ref-type="supplementary-material" rid="SM1">S1</xref>. These primers can be used to distinguish <italic>S. cusia</italic> and three of its most closely related species: <italic>A. paniculata</italic>, <italic>R. breedlovei</italic> and <italic>T. tetragonolobum</italic>. In addition, we designed a set of primers that can be used to amplify 130 SSR sequences shown in Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S3</xref> using the program primer3<sup><xref ref-type="fn" rid="fn03">3</xref></sup>. The detailed results are shown in Supplementary File <xref ref-type="supplementary-material" rid="SM1">S2</xref>. The validation of these primers for effective inter-specific and intra-specific discrimination will be the subject of future studies.</p>
<p>The cp genomes offer numerous applications. First, the cp genome is rich with molecular markers that can be used to distinguish different species (<xref ref-type="bibr" rid="B41">Song et al., 2015</xref>; <xref ref-type="bibr" rid="B55">Yang et al., 2016</xref>; <xref ref-type="bibr" rid="B52">Xu et al., 2017</xref>); different varieties from the same species (<xref ref-type="bibr" rid="B53">Xu et al., 2015</xref>; <xref ref-type="bibr" rid="B35">Pervaiz et al., 2016</xref>), and possibly different individuals within the same species (<xref ref-type="bibr" rid="B23">Lei et al., 2016</xref>). Owing to the acquisition of the first complete genome of <italic>S. cusia</italic>, sequencing of additional plastid genomes from other <italic>Strobilanthes</italic> species and varieties of <italic>S. cusia</italic> becomes increasingly easy, consequently providing the basis for the identification of molecular markers that can be used for identity determination at various levels. Second, the overall high conservation levels of the cp genome are useful for phylogenomic study. Third, plastid genomes have been implicated in genetic engineering to encode and express endogenous and exogenous proteins for health and economic benefits (<xref ref-type="bibr" rid="B6">Daniell et al., 2016</xref>; <xref ref-type="bibr" rid="B8">Dyo and Purton, 2018</xref>). Identification of the complete genome is a requirement for determining the appropriate insertion sites and designing the primers used in genetic engineering experiments. The results obtained from this study have laid the foundation for future cp-based genetic engineering of <italic>S. cusia</italic>.</p>
<p>The presence of two IRs is one of the most notable features in the cp genomes (cpDNAs). In general, the gene arrangement in IR regions in monocot genomes is different from that in eudicot genomes. For example, in monocots, the <italic>trnH</italic> gene is located in the IR region, and in most eudicots, <italic>trnH</italic> gene is located in the LSC region (<xref ref-type="bibr" rid="B14">Huotari and Korpelainen, 2012</xref>). In land plants, dynamic expansion/contraction of IRs has been previously reported in several lineages, such as Berberidaceae (<xref ref-type="bibr" rid="B30">Ma et al., 2013</xref>), Mimosoid legume (<xref ref-type="bibr" rid="B7">Dugas et al., 2015</xref>), Geraniaceae (<xref ref-type="bibr" rid="B47">Weng et al., 2014</xref>), and Hydatellaceae (<xref ref-type="bibr" rid="B11">Goremykin et al., 2013</xref>), which presents extreme expansions of IRs, Lauraceae (<xref ref-type="bibr" rid="B41">Song et al., 2015</xref>), and Apioideae (<xref ref-type="bibr" rid="B36">Plunkett and Downie, 2000</xref>), which exhibits extreme contractions of IRs. The fluctuating lengths of IRs contribute to increase or decrease cpDNA sizes and can be utilized to address phylogeny issues (<xref ref-type="bibr" rid="B50">Wolf et al., 2010</xref>).</p>
</sec>
<sec><title>Author Contributions</title>
<p>WW collected the sample of <italic>Strobilanthes cusia</italic> (Nees) Kuntze and wrote part of the Introduction and Discussion sections. CL conceived the study and wrote the Introduction and Discussion sections. ZZ and LH identified the plant material. JS extracted DNA. HC performed data analysis and wrote the manuscript. HZ, MJ, and DY performed the PCR experiments. MH, MR, XL, and BS performed the next-generation sequencing experiments.</p>
</sec>
<sec><title>Conflict of Interest Statement</title>
<p>MH, MR, XL, and BS are employees of Illumina Corporation. The other authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</body>
<back>
<fn-group>
<fn fn-type="financial-disclosure">
<p><bold>Funding.</bold> This work was supported by grants from CAMS Innovation Fund for Medical Sciences (CIFMS) (2016-I2M-3-016 and 2017-I2M-1-013), from the Chinese Academy of Medical Science, Guangxi Science and Technology Program (AD16380013).</p>
</fn>
</fn-group>
<sec sec-type="supplementary material">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2018.00324/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2018.00324/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.zip" id="SM1" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink">
</supplementary-material>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Benson</surname> <given-names>G.</given-names></name></person-group> (<year>1999</year>). <article-title>Tandem repeats finder: a program to analyze DNA sequences.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>27</volume> <fpage>573</fpage>&#x2013;<lpage>580</lpage>. <pub-id pub-id-type="doi">10.1093/nar/27.2.573</pub-id> <pub-id pub-id-type="pmid">9862982</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>H.</given-names></name> <name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Yuan</surname> <given-names>G.</given-names></name> <name><surname>Liu</surname> <given-names>C.</given-names></name></person-group> (<year>2014</year>). <article-title>Complex interplay among DNA modification, noncoding RNA expression and protein-coding RNA expression in <italic>Salvia miltiorrhiza</italic> chloroplast genome.</article-title> <source><italic>PLoS One</italic></source> <volume>9</volume>:<issue>e99314</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0099314</pub-id> <pub-id pub-id-type="pmid">24914614</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><collab>Chinese Pharmacopoeia Commission</collab> (<year>2015</year>). <source><italic>The Pharmacopoeia of the People&#x2019;s Republic of China, 2015 Edition Part I.</italic></source> <publisher-loc>Beijing</publisher-loc>: <publisher-name>China Medical Science Press</publisher-name>.</citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chumley</surname> <given-names>T. W.</given-names></name> <name><surname>Palmer</surname> <given-names>J. D.</given-names></name> <name><surname>Mower</surname> <given-names>J. P.</given-names></name> <name><surname>Fourcade</surname> <given-names>H. M.</given-names></name> <name><surname>Calie</surname> <given-names>P. J.</given-names></name> <name><surname>Boore</surname> <given-names>J. L.</given-names></name><etal/></person-group> (<year>2006</year>). <article-title>The complete chloroplast genome sequence of <italic>Pelargonium x hortorum</italic>: organization and evolution of the largest and most highly rearranged chloroplast genome of land plants.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>23</volume> <fpage>2175</fpage>&#x2013;<lpage>2190</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msl089</pub-id> <pub-id pub-id-type="pmid">16916942</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cui</surname> <given-names>L.</given-names></name> <name><surname>Veeraraghavan</surname> <given-names>N.</given-names></name> <name><surname>Richter</surname> <given-names>A.</given-names></name> <name><surname>Wall</surname> <given-names>K.</given-names></name> <name><surname>Jansen</surname> <given-names>R. K.</given-names></name> <name><surname>Leebens-Mack</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2006</year>). <article-title>ChloroplastDB: the chloroplast genome database.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>34</volume> <fpage>D692</fpage>&#x2013;<lpage>D696</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkj055</pub-id> <pub-id pub-id-type="pmid">16381961</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Daniell</surname> <given-names>H.</given-names></name> <name><surname>Lin</surname> <given-names>C. S.</given-names></name> <name><surname>Yu</surname> <given-names>M.</given-names></name> <name><surname>Chang</surname> <given-names>W. J.</given-names></name></person-group> (<year>2016</year>). <article-title>Chloroplast genomes: diversity, evolution, and applications in genetic engineering.</article-title> <source><italic>Genome Biol.</italic></source> <volume>17</volume>:<issue>134</issue>. <pub-id pub-id-type="doi">10.1186/s13059-016-1004-2</pub-id> <pub-id pub-id-type="pmid">27339192</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dugas</surname> <given-names>D. V.</given-names></name> <name><surname>Hernandez</surname> <given-names>D.</given-names></name> <name><surname>Koenen</surname> <given-names>E. J.</given-names></name> <name><surname>Schwarz</surname> <given-names>E.</given-names></name> <name><surname>Straub</surname> <given-names>S.</given-names></name> <name><surname>Hughes</surname> <given-names>C. E.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Mimosoid legume plastome evolution: IR expansion, tandem repeat expansions, and accelerated rate of evolution in clpP.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>5</volume>:<issue>16958</issue>. <pub-id pub-id-type="doi">10.1038/srep16958</pub-id> <pub-id pub-id-type="pmid">26592928</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dyo</surname> <given-names>Y. M.</given-names></name> <name><surname>Purton</surname> <given-names>S.</given-names></name></person-group> (<year>2018</year>). <article-title>The algal chloroplast as a synthetic biology platform for production of therapeutic proteins.</article-title> <source><italic>Microbiology</italic></source> <volume>164</volume> <fpage>113</fpage>&#x2013;<lpage>121</lpage>. <pub-id pub-id-type="doi">10.1099/mic.0.000599</pub-id> <pub-id pub-id-type="pmid">29297850</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><collab>Flora of China Editorial Committee</collab> <role>(ed.)</role>. (<year>2011</year>). <source><italic>Flora of China.</italic></source> <publisher-loc>Beijing</publisher-loc>: <publisher-name>Science Press</publisher-name>.</citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Golden</surname> <given-names>J. L.</given-names></name> <name><surname>Bain</surname> <given-names>J. F.</given-names></name></person-group> (<year>2000</year>). <article-title>Phylogeographic patterns and high levels of chloroplast DNA diversity in four Packera (asteraceae) species in southwestern Alberta.</article-title> <source><italic>Evolution</italic></source> <volume>54</volume> <fpage>1566</fpage>&#x2013;<lpage>1579</lpage>. <pub-id pub-id-type="doi">10.1111/j.0014-3820.2000.tb00702.x</pub-id> <pub-id pub-id-type="pmid">11108585</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Goremykin</surname> <given-names>V. V.</given-names></name> <name><surname>Nikiforova</surname> <given-names>S. V.</given-names></name> <name><surname>Biggs</surname> <given-names>P. J.</given-names></name> <name><surname>Zhong</surname> <given-names>B.</given-names></name> <name><surname>Delange</surname> <given-names>P.</given-names></name> <name><surname>Martin</surname> <given-names>W.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>The evolutionary root of flowering plants.</article-title> <source><italic>Syst. Biol.</italic></source> <volume>62</volume> <fpage>50</fpage>&#x2013;<lpage>61</lpage>. <pub-id pub-id-type="doi">10.1093/sysbio/sys070</pub-id> <pub-id pub-id-type="pmid">22851550</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gu</surname> <given-names>W.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Hao</surname> <given-names>X. J.</given-names></name> <name><surname>Yang</surname> <given-names>F. M.</given-names></name> <name><surname>Sun</surname> <given-names>Q. Y.</given-names></name> <name><surname>Morris-Natschke</surname> <given-names>S. L.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Indole alkaloid glycosides from the aerial parts of <italic>Strobilanthes cusia</italic>.</article-title> <source><italic>J. Nat. Prod.</italic></source> <volume>77</volume> <fpage>2590</fpage>&#x2013;<lpage>2594</lpage>. <pub-id pub-id-type="doi">10.1021/np5003274</pub-id> <pub-id pub-id-type="pmid">25427242</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Honda</surname> <given-names>G.</given-names></name> <name><surname>Tabata</surname> <given-names>M.</given-names></name></person-group> (<year>1979</year>). <article-title>Isolation of antifungal principle tryptanthrin, from <italic>Strobilanthes cusia</italic> O. Kuntze.</article-title> <source><italic>Planta Med.</italic></source> <volume>36</volume> <fpage>85</fpage>&#x2013;<lpage>90</lpage>. <pub-id pub-id-type="doi">10.1055/s-0028-1097245</pub-id> <pub-id pub-id-type="pmid">461559</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huotari</surname> <given-names>T.</given-names></name> <name><surname>Korpelainen</surname> <given-names>H.</given-names></name></person-group> (<year>2012</year>). <article-title>Complete chloroplast genome sequence of <italic>Elodea canadensis</italic> and comparative analyses with other monocot plastid genomes.</article-title> <source><italic>Gene</italic></source> <volume>508</volume> <fpage>96</fpage>&#x2013;<lpage>105</lpage>. <pub-id pub-id-type="doi">10.1016/j.gene.2012.07.020</pub-id> <pub-id pub-id-type="pmid">22841789</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ichimaru</surname> <given-names>Y.</given-names></name> <name><surname>Saito</surname> <given-names>H.</given-names></name> <name><surname>Uchiyama</surname> <given-names>T.</given-names></name> <name><surname>Metori</surname> <given-names>K.</given-names></name> <name><surname>Tabata</surname> <given-names>K.</given-names></name> <name><surname>Suzuki</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Indirubin 3&#x2032;-(O-oxiran-2-ylmethyl)oxime: a novel anticancer agent.</article-title> <source><italic>Bioorg. Med. Chem. Lett.</italic></source> <volume>25</volume> <fpage>1403</fpage>&#x2013;<lpage>1406</lpage>. <pub-id pub-id-type="doi">10.1016/j.bmcl.2015.02.053</pub-id> <pub-id pub-id-type="pmid">25765906</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jansen</surname> <given-names>R. K.</given-names></name> <name><surname>Cai</surname> <given-names>Z.</given-names></name> <name><surname>Raubeson</surname> <given-names>L. A.</given-names></name> <name><surname>Daniell</surname> <given-names>H.</given-names></name> <name><surname>Depamphilis</surname> <given-names>C. W.</given-names></name> <name><surname>Leebens-Mack</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>Analysis of 81 genes from 64 plastid genomes resolves relationships in angiosperms and identifies genome-scale evolutionary patterns.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>104</volume> <fpage>19369</fpage>&#x2013;<lpage>19374</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0709121104</pub-id> <pub-id pub-id-type="pmid">18048330</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Krumsiek</surname> <given-names>J.</given-names></name> <name><surname>Arnold</surname> <given-names>R.</given-names></name> <name><surname>Rattei</surname> <given-names>T.</given-names></name></person-group> (<year>2007</year>). <article-title>Gepard: a rapid and sensitive tool for creating dotplots on genome scale.</article-title> <source><italic>Bioinformatics</italic></source> <volume>23</volume> <fpage>1026</fpage>&#x2013;<lpage>1028</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btm039</pub-id> <pub-id pub-id-type="pmid">17309896</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kuang</surname> <given-names>D. Y.</given-names></name> <name><surname>Wu</surname> <given-names>H.</given-names></name> <name><surname>Wang</surname> <given-names>Y. L.</given-names></name> <name><surname>Gao</surname> <given-names>L. M.</given-names></name> <name><surname>Zhang</surname> <given-names>S. Z.</given-names></name> <name><surname>Lu</surname> <given-names>L.</given-names></name></person-group> (<year>2011</year>). <article-title>Complete chloroplast genome sequence of <italic>Magnolia kwangsiensis</italic> (Magnoliaceae): implication for DNA barcoding and population genetics.</article-title> <source><italic>Genome</italic></source> <volume>54</volume> <fpage>663</fpage>&#x2013;<lpage>673</lpage>. <pub-id pub-id-type="doi">10.1139/G11-026</pub-id> <pub-id pub-id-type="pmid">21793699</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kumagai</surname> <given-names>T.</given-names></name> <name><surname>Aratsu</surname> <given-names>Y.</given-names></name> <name><surname>Sugawara</surname> <given-names>R.</given-names></name> <name><surname>Sasaki</surname> <given-names>T.</given-names></name> <name><surname>Miyairi</surname> <given-names>S.</given-names></name> <name><surname>Nagata</surname> <given-names>K.</given-names></name></person-group> (<year>2016</year>). <article-title>Indirubin, a component of Ban-Lan-Gen, activates CYP3A4 gene transcription through the human pregnane X receptor.</article-title> <source><italic>Drug Metab. Pharmacokinet.</italic></source> <volume>31</volume> <fpage>139</fpage>&#x2013;<lpage>145</lpage>. <pub-id pub-id-type="doi">10.1016/j.dmpk.2016.01.002</pub-id> <pub-id pub-id-type="pmid">26987505</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kurtz</surname> <given-names>S.</given-names></name> <name><surname>Choudhuri</surname> <given-names>J. V.</given-names></name> <name><surname>Ohlebusch</surname> <given-names>E.</given-names></name> <name><surname>Schleiermacher</surname> <given-names>C.</given-names></name> <name><surname>Stoye</surname> <given-names>J.</given-names></name> <name><surname>Giegerich</surname> <given-names>R.</given-names></name></person-group> (<year>2001</year>). <article-title>REPuter: the manifold applications of repeat analysis on a genomic scale.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>29</volume> <fpage>4633</fpage>&#x2013;<lpage>4642</lpage>. <pub-id pub-id-type="doi">10.1093/nar/29.22.4633</pub-id> <pub-id pub-id-type="pmid">11713313</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Laslett</surname> <given-names>D.</given-names></name> <name><surname>Canback</surname> <given-names>B.</given-names></name></person-group> (<year>2004</year>). <article-title>ARAGORN, a program to detect tRNA genes and tmRNA genes in nucleotide sequences.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>32</volume> <fpage>11</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkh152</pub-id> <pub-id pub-id-type="pmid">14704338</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>E.</given-names></name> <name><surname>Harris</surname> <given-names>N.</given-names></name> <name><surname>Gibson</surname> <given-names>M.</given-names></name> <name><surname>Chetty</surname> <given-names>R.</given-names></name> <name><surname>Lewis</surname> <given-names>S.</given-names></name></person-group> (<year>2009</year>). <article-title>Apollo: a community resource for genome annotation editing.</article-title> <source><italic>Bioinformatics</italic></source> <volume>25</volume> <fpage>1836</fpage>&#x2013;<lpage>1837</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp314</pub-id> <pub-id pub-id-type="pmid">19439563</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lei</surname> <given-names>W.</given-names></name> <name><surname>Ni</surname> <given-names>D.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Shao</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>X.</given-names></name> <name><surname>Yang</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Intraspecific and heteroplasmic variations, gene losses and inversions in the chloroplast genome of <italic>Astragalus membranaceus</italic>.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>6</volume>:<issue>21669</issue>. <pub-id pub-id-type="doi">10.1038/srep21669</pub-id> <pub-id pub-id-type="pmid">26899134</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Leister</surname> <given-names>D.</given-names></name></person-group> (<year>2003</year>). <article-title>Chloroplast research in the genomic age.</article-title> <source><italic>Trends Genet.</italic></source> <volume>19</volume> <fpage>47</fpage>&#x2013;<lpage>56</lpage>. <pub-id pub-id-type="doi">10.1016/S0168-9525(02)00003-3</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Zhang</surname> <given-names>T. C.</given-names></name> <name><surname>Qiao</surname> <given-names>Q.</given-names></name> <name><surname>Ren</surname> <given-names>Z.</given-names></name> <name><surname>Zhao</surname> <given-names>J.</given-names></name> <name><surname>Yonezawa</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Complete chloroplast genome sequence of holoparasite <italic>Cistanche deserticola</italic> (Orobanchaceae) reveals gene loss and horizontal gene transfer from its host <italic>Haloxylon ammodendron</italic> (Chenopodiaceae).</article-title> <source><italic>PLoS One</italic></source> <volume>8</volume>:<issue>e58747</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0058747</pub-id> <pub-id pub-id-type="pmid">23554920</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>C.</given-names></name> <name><surname>Shi</surname> <given-names>L.</given-names></name> <name><surname>Zhu</surname> <given-names>Y.</given-names></name> <name><surname>Chen</surname> <given-names>H.</given-names></name> <name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Lin</surname> <given-names>X.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>CpGAVAS, an integrated web server for the annotation, visualization, analysis, and GenBank submission of completely sequenced chloroplast genome sequences.</article-title> <source><italic>BMC Genomics</italic></source> <volume>13</volume>:<issue>715</issue>. <pub-id pub-id-type="doi">10.1186/1471-2164-13-715</pub-id> <pub-id pub-id-type="pmid">23256920</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>Y.</given-names></name> <name><surname>Ahmed</surname> <given-names>S.</given-names></name> <name><surname>Liu</surname> <given-names>B.</given-names></name> <name><surname>Guo</surname> <given-names>Z.</given-names></name> <name><surname>Huang</surname> <given-names>W.</given-names></name> <name><surname>Wu</surname> <given-names>X.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Ethnobotany of dye plants in Dong communities of China.</article-title> <source><italic>J. Ethnobiol. Ethnomed.</italic></source> <volume>10</volume>:<issue>23</issue>. <pub-id pub-id-type="doi">10.1186/1746-4269-10-23</pub-id> <pub-id pub-id-type="pmid">24552267</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lohse</surname> <given-names>M.</given-names></name> <name><surname>Drechsel</surname> <given-names>O.</given-names></name> <name><surname>Kahlau</surname> <given-names>S.</given-names></name> <name><surname>Bock</surname> <given-names>R.</given-names></name></person-group> (<year>2013</year>). <article-title>OrganellarGenomeDRAW&#x2013;a suite of tools for generating physical maps of plastid and mitochondrial genomes and visualizing expression data sets.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>41</volume> <fpage>W575</fpage>&#x2013;<lpage>W581</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkt289</pub-id> <pub-id pub-id-type="pmid">23609545</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lowe</surname> <given-names>T. M.</given-names></name> <name><surname>Eddy</surname> <given-names>S. R.</given-names></name></person-group> (<year>1997</year>). <article-title>tRNAscan-SE: a program for improved detection of transfer RNA genes in genomic sequence.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>25</volume> <fpage>955</fpage>&#x2013;<lpage>964</lpage>. <pub-id pub-id-type="doi">10.1093/nar/25.5.0955</pub-id> <pub-id pub-id-type="pmid">9023104</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ma</surname> <given-names>J.</given-names></name> <name><surname>Yang</surname> <given-names>B.</given-names></name> <name><surname>Zhu</surname> <given-names>W.</given-names></name> <name><surname>Sun</surname> <given-names>L.</given-names></name> <name><surname>Tian</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>X.</given-names></name></person-group> (<year>2013</year>). <article-title>The complete chloroplast genome sequence of <italic>Mahonia bealei</italic> (Berberidaceae) reveals a significant expansion of the inverted repeat and phylogenetic relationship with other angiosperms.</article-title> <source><italic>Gene</italic></source> <volume>528</volume> <fpage>120</fpage>&#x2013;<lpage>131</lpage>. <pub-id pub-id-type="doi">10.1016/j.gene.2013.07.037</pub-id> <pub-id pub-id-type="pmid">23900198</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Merz</surname> <given-names>K. H.</given-names></name> <name><surname>Schwahn</surname> <given-names>S.</given-names></name> <name><surname>Hippe</surname> <given-names>F.</given-names></name> <name><surname>Muhlbeyer</surname> <given-names>S.</given-names></name> <name><surname>Jakobs</surname> <given-names>S.</given-names></name> <name><surname>Eisenbrand</surname> <given-names>G.</given-names></name></person-group> (<year>2004</year>). <article-title>Novel indirubin derivatives, promising anti-tumor agents inhibiting cyclin-dependent kinases.</article-title> <source><italic>Int. J. Clin. Pharmacol. Ther.</italic></source> <volume>42</volume> <fpage>656</fpage>&#x2013;<lpage>658</lpage>. <pub-id pub-id-type="doi">10.5414/CPP42656</pub-id> <pub-id pub-id-type="pmid">15598038</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nock</surname> <given-names>C. J.</given-names></name> <name><surname>Waters</surname> <given-names>D. L.</given-names></name> <name><surname>Edwards</surname> <given-names>M. A.</given-names></name> <name><surname>Bowen</surname> <given-names>S. G.</given-names></name> <name><surname>Rice</surname> <given-names>N.</given-names></name> <name><surname>Cordeiro</surname> <given-names>G. M.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Chloroplast genome sequences from total DNA for plant identification.</article-title> <source><italic>Plant Biotechnol. J.</italic></source> <volume>9</volume> <fpage>328</fpage>&#x2013;<lpage>333</lpage>. <pub-id pub-id-type="doi">10.1111/j.1467-7652.2010.00558.x</pub-id> <pub-id pub-id-type="pmid">20796245</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Otsuka</surname> <given-names>H.</given-names></name> <name><surname>Hirai</surname> <given-names>Y.</given-names></name> <name><surname>Nagao</surname> <given-names>T.</given-names></name> <name><surname>Yamasaki</surname> <given-names>K.</given-names></name></person-group> (<year>1988</year>). <article-title>Anti-inflammatory activity of benzoxazinoids from roots of <italic>Coix lacryma-jobi</italic> var. ma-yuen.</article-title> <source><italic>J. Nat. Prod.</italic></source> <volume>51</volume> <fpage>74</fpage>&#x2013;<lpage>79</lpage>. <pub-id pub-id-type="doi">10.1021/np50055a009</pub-id></citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Palme</surname> <given-names>A. E.</given-names></name> <name><surname>Su</surname> <given-names>Q.</given-names></name> <name><surname>Palsson</surname> <given-names>S.</given-names></name> <name><surname>Lascoux</surname> <given-names>M.</given-names></name></person-group> (<year>2004</year>). <article-title>Extensive sharing of chloroplast haplotypes among European birches indicates hybridization among <italic>Betula pendula</italic>, <italic>B. pubescens</italic> and <italic>B. nana</italic>.</article-title> <source><italic>Mol. Ecol.</italic></source> <volume>13</volume> <fpage>167</fpage>&#x2013;<lpage>178</lpage>. <pub-id pub-id-type="doi">10.1046/j.1365-294X.2003.02034.x</pub-id> <pub-id pub-id-type="pmid">14653797</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pervaiz</surname> <given-names>T.</given-names></name> <name><surname>Cheng</surname> <given-names>Z.</given-names></name> <name><surname>Faheem</surname> <given-names>M.</given-names></name> <name><surname>Fang</surname> <given-names>J.</given-names></name></person-group> (<year>2016</year>). <article-title>Chloroplast based genetic diversity among Chinese grapes genotypes.</article-title> <source><italic>Mitochondrial DNA A DNA Mapp. Seq. Anal.</italic></source> <volume>28</volume> <fpage>565</fpage>&#x2013;<lpage>569</lpage>. <pub-id pub-id-type="doi">10.3109/24701394.2016.1155119</pub-id> <pub-id pub-id-type="pmid">27159719</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Plunkett</surname> <given-names>G. M.</given-names></name> <name><surname>Downie</surname> <given-names>S. R.</given-names></name></person-group> (<year>2000</year>). <article-title>Expansion and contraction of the chloroplast inverted repeat in Apiaceae subfamily Apioideae.</article-title> <source><italic>Syst. Bot.</italic></source> <volume>25</volume> <fpage>648</fpage>&#x2013;<lpage>667</lpage>. <pub-id pub-id-type="doi">10.2307/2666726</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Revanna</surname> <given-names>K. V.</given-names></name> <name><surname>Chiu</surname> <given-names>C. C.</given-names></name> <name><surname>Bierschank</surname> <given-names>E.</given-names></name> <name><surname>Dong</surname> <given-names>Q.</given-names></name></person-group> (<year>2011</year>). <article-title>GSV: a web-based genome synteny viewer for customized data.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>12</volume>:<issue>316</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-12-316</pub-id> <pub-id pub-id-type="pmid">21810250</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rice</surname> <given-names>P.</given-names></name> <name><surname>Longden</surname> <given-names>I.</given-names></name> <name><surname>Bleasby</surname> <given-names>A.</given-names></name></person-group> (<year>2000</year>). <article-title>EMBOSS: the European molecular biology open software suite.</article-title> <source><italic>Trends Genet.</italic></source> <volume>16</volume> <fpage>276</fpage>&#x2013;<lpage>277</lpage>. <pub-id pub-id-type="doi">10.1016/S0168-9525(00)02024-2</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Silva</surname> <given-names>S. R.</given-names></name> <name><surname>Diaz</surname> <given-names>Y. C.</given-names></name> <name><surname>Penha</surname> <given-names>H. A.</given-names></name> <name><surname>Pinheiro</surname> <given-names>D. G.</given-names></name> <name><surname>Fernandes</surname> <given-names>C. C.</given-names></name> <name><surname>Miranda</surname> <given-names>V. F.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>The chloroplast genome of <italic>Utricularia reniformis</italic> sheds light on the evolution of the ndh gene complex of terrestrial carnivorous plants from the Lentibulariaceae family.</article-title> <source><italic>PLoS One</italic></source> <volume>11</volume>:<issue>e0165176</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0165176</pub-id> <pub-id pub-id-type="pmid">27764252</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Simpson</surname> <given-names>J. T.</given-names></name> <name><surname>Wong</surname> <given-names>K.</given-names></name> <name><surname>Jackman</surname> <given-names>S. D.</given-names></name> <name><surname>Schein</surname> <given-names>J. E.</given-names></name> <name><surname>Jones</surname> <given-names>S. J.</given-names></name> <name><surname>Birol</surname> <given-names>I.</given-names></name></person-group> (<year>2009</year>). <article-title>ABySS: a parallel assembler for short read sequence data.</article-title> <source><italic>Genome Res.</italic></source> <volume>19</volume> <fpage>1117</fpage>&#x2013;<lpage>1123</lpage>. <pub-id pub-id-type="doi">10.1101/gr.089532.108</pub-id> <pub-id pub-id-type="pmid">19251739</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Song</surname> <given-names>Y.</given-names></name> <name><surname>Dong</surname> <given-names>W.</given-names></name> <name><surname>Liu</surname> <given-names>B.</given-names></name> <name><surname>Xu</surname> <given-names>C.</given-names></name> <name><surname>Yao</surname> <given-names>X.</given-names></name> <name><surname>Gao</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Comparative analysis of complete chloroplast genome sequences of two tropical trees <italic>Machilus yunnanensis</italic> and <italic>Machilus balansae</italic> in the family Lauraceae.</article-title> <source><italic>Front. Plant Sci.</italic></source> <volume>6</volume>:<issue>662</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2015.00662</pub-id> <pub-id pub-id-type="pmid">26379689</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>X. B.</given-names></name> <name><surname>Sheng</surname> <given-names>J. R.</given-names></name> <name><surname>Wang</surname> <given-names>D. P.</given-names></name></person-group> (<year>2008</year>). <article-title>Research progress of chemical constituents and pharmacological activities for <italic>Baphicacanthus cusia</italic> (Nees)Bremek.</article-title> <source><italic>Guangxi Shifan Xueyuan Xuebao</italic></source> <volume>25</volume> <fpage>66</fpage>&#x2013;<lpage>69</lpage>.</citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stamatakis</surname> <given-names>A.</given-names></name></person-group> (<year>2015</year>). <article-title>Using RAxML to infer phylogenies.</article-title> <source><italic>Curr. Protoc. Bioinformatics</italic></source> <volume>51</volume> <issue>6</issue>.14.<fpage>1</fpage>&#x2013;<lpage>16</lpage>.14.14. <pub-id pub-id-type="doi">10.1002/0471250953.bi0614s51</pub-id> <pub-id pub-id-type="pmid">26334924</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Steane</surname> <given-names>D. A.</given-names></name></person-group> (<year>2005</year>). <article-title>Complete nucleotide sequence of the chloroplast genome from the Tasmanian blue gum, <italic>Eucalyptus globulus</italic> (Myrtaceae).</article-title> <source><italic>DNA Res.</italic></source> <volume>12</volume> <fpage>215</fpage>&#x2013;<lpage>220</lpage>. <pub-id pub-id-type="doi">10.1093/dnares/dsi006</pub-id> <pub-id pub-id-type="pmid">16303753</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Twyford</surname> <given-names>A. D.</given-names></name> <name><surname>Ness</surname> <given-names>R. W.</given-names></name></person-group> (<year>2016</year>). <article-title>Strategies for complete plastid genome sequencing.</article-title> <source><italic>Mol. Ecol. Resour.</italic></source> <volume>17</volume> <fpage>858</fpage>&#x2013;<lpage>868</lpage>. <pub-id pub-id-type="doi">10.1111/1755-0998.12626</pub-id> <pub-id pub-id-type="pmid">27790830</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>B.</given-names></name> <name><surname>Chen</surname> <given-names>H.</given-names></name> <name><surname>Ma</surname> <given-names>H.</given-names></name> <name><surname>Zhang</surname> <given-names>H.</given-names></name> <name><surname>Lei</surname> <given-names>W.</given-names></name> <name><surname>Wu</surname> <given-names>W.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Complete plastid genome of <italic>Astragalus membranaceus</italic> (Fisch.) Bunge var. membranaceus.</article-title> <source><italic>Mitochondrial DNA B Resour.</italic></source> <volume>1</volume> <fpage>517</fpage>&#x2013;<lpage>519</lpage>. <pub-id pub-id-type="pmid">26899134</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Weng</surname> <given-names>M. L.</given-names></name> <name><surname>Blazier</surname> <given-names>J. C.</given-names></name> <name><surname>Govindu</surname> <given-names>M.</given-names></name> <name><surname>Jansen</surname> <given-names>R. K.</given-names></name></person-group> (<year>2014</year>). <article-title>Reconstruction of the ancestral plastid genome in Geraniaceae reveals a correlation between genome rearrangements, repeats, and nucleotide substitution rates.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>31</volume> <fpage>645</fpage>&#x2013;<lpage>659</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/mst257</pub-id> <pub-id pub-id-type="pmid">24336877</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wicke</surname> <given-names>S.</given-names></name> <name><surname>Muller</surname> <given-names>K. F.</given-names></name> <name><surname>Depamphilis</surname> <given-names>C. W.</given-names></name> <name><surname>Quandt</surname> <given-names>D.</given-names></name> <name><surname>Bellot</surname> <given-names>S.</given-names></name> <name><surname>Schneeweiss</surname> <given-names>G. M.</given-names></name></person-group> (<year>2016</year>). <article-title>Mechanistic model of evolutionary rate variation en route to a nonphotosynthetic lifestyle in plants.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>113</volume> <fpage>9045</fpage>&#x2013;<lpage>9050</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1607576113</pub-id> <pub-id pub-id-type="pmid">27450087</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wicke</surname> <given-names>S.</given-names></name> <name><surname>Schneeweiss</surname> <given-names>G. M.</given-names></name> <name><surname>Depamphilis</surname> <given-names>C. W.</given-names></name> <name><surname>Muller</surname> <given-names>K. F.</given-names></name> <name><surname>Quandt</surname> <given-names>D.</given-names></name></person-group> (<year>2011</year>). <article-title>The evolution of the plastid chromosome in land plants: gene content, gene order, gene function.</article-title> <source><italic>Plant Mol. Biol.</italic></source> <volume>76</volume> <fpage>273</fpage>&#x2013;<lpage>297</lpage>. <pub-id pub-id-type="doi">10.1007/s11103-011-9762-4</pub-id> <pub-id pub-id-type="pmid">21424877</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wolf</surname> <given-names>P. G.</given-names></name> <name><surname>Roper</surname> <given-names>J. M.</given-names></name> <name><surname>Duffy</surname> <given-names>A. M.</given-names></name></person-group> (<year>2010</year>). <article-title>The evolution of chloroplast genome structure in ferns.</article-title> <source><italic>Genome</italic></source> <volume>53</volume> <fpage>731</fpage>&#x2013;<lpage>738</lpage>. <pub-id pub-id-type="doi">10.1139/g10-061</pub-id> <pub-id pub-id-type="pmid">20924422</pub-id></citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname> <given-names>Z. Y.</given-names></name> <name><surname>Raven</surname> <given-names>P. H.</given-names></name> <name><surname>Hong</surname> <given-names>D. Y.</given-names></name></person-group> (<year>2006</year>). <source><italic>Flora of China</italic></source>. <publisher-loc>Beijing</publisher-loc>: <publisher-name>Science Press</publisher-name>.</citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>C.</given-names></name> <name><surname>Dong</surname> <given-names>W.</given-names></name> <name><surname>Li</surname> <given-names>W.</given-names></name> <name><surname>Lu</surname> <given-names>Y.</given-names></name> <name><surname>Xie</surname> <given-names>X.</given-names></name> <name><surname>Jin</surname> <given-names>X.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Comparative analysis of six <italic>Lagerstroemia</italic> complete chloroplast genomes.</article-title> <source><italic>Front. Plant Sci.</italic></source> <volume>8</volume>:<issue>15</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2017.00015</pub-id> <pub-id pub-id-type="pmid">28154574</pub-id></citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>M.</given-names></name> <name><surname>Xu</surname> <given-names>L. A.</given-names></name> <name><surname>Cao</surname> <given-names>F. L.</given-names></name> <name><surname>Zhang</surname> <given-names>H. J.</given-names></name> <name><surname>Yu</surname> <given-names>F. X.</given-names></name></person-group> (<year>2015</year>). <article-title>Development of novel chloroplast microsatellite markers for <italic>Ginkgo biloba</italic>.</article-title> <source><italic>Genet. Mol. Res.</italic></source> <volume>14</volume> <fpage>7715</fpage>&#x2013;<lpage>7720</lpage>. <pub-id pub-id-type="doi">10.4238/2015.July.13.17</pub-id> <pub-id pub-id-type="pmid">26214452</pub-id></citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xue</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>S.</given-names></name> <name><surname>Zhou</surname> <given-names>S. L.</given-names></name></person-group> (<year>2012</year>). <article-title>Polymorphic chloroplast microsatellite loci in Nelumbo (Nelumbonaceae).</article-title> <source><italic>Am. J. Bot.</italic></source> <volume>99</volume> <fpage>e240</fpage>&#x2013;<lpage>e244</lpage>. <pub-id pub-id-type="doi">10.3732/ajb.1100547</pub-id> <pub-id pub-id-type="pmid">22615305</pub-id></citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>Y.</given-names></name> <name><surname>Zhou</surname> <given-names>T.</given-names></name> <name><surname>Duan</surname> <given-names>D.</given-names></name> <name><surname>Yang</surname> <given-names>J.</given-names></name> <name><surname>Feng</surname> <given-names>L.</given-names></name> <name><surname>Zhao</surname> <given-names>G.</given-names></name></person-group> (<year>2016</year>). <article-title>Comparative analysis of the complete chloroplast genomes of five <italic>Quercus</italic> species.</article-title> <source><italic>Front. Plant Sci.</italic></source> <volume>7</volume>:<issue>959</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2016.00959</pub-id> <pub-id pub-id-type="pmid">27446185</pub-id></citation></ref>
</ref-list>
<fn-group>
<fn id="fn01"><label>1</label><p><ext-link ext-link-type="uri" xlink:href="http://foc.eflora.cn/">http://foc.eflora.cn/</ext-link></p></fn>
<fn id="fn02"><label>2</label><p><ext-link ext-link-type="uri" xlink:href="http://metabarcoding.org/obitools/doc/scripts/ecoPrimers.html">http://metabarcoding.org/obitools/doc/scripts/ecoPrimers.html</ext-link></p></fn>
<fn id="fn03"><label>3</label><p><ext-link ext-link-type="uri" xlink:href="https://sourceforge.net/projects/primer3/">https://sourceforge.net/projects/primer3/</ext-link></p></fn>
</fn-group>
</back>
</article>