<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2016.01847</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Chloroplast Genome Sequence of Pigeonpea (<italic>Cajanus cajan</italic> (L.) Millspaugh) and <italic>Cajanus scarabaeoides</italic> (L.) Thouars: Genome Organization and Comparison with Other Legumes</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author"><name><surname>Kaila</surname> <given-names>Tanvi</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/375972/overview"/></contrib>
<contrib contrib-type="author"><name><surname>Chaduvla</surname> <given-names>Pavan K.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/394296/overview"/></contrib>
<contrib contrib-type="author"><name><surname>Saxena</surname> <given-names>Swati</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/391807/overview"/></contrib>
<contrib contrib-type="author"><name><surname>Bahadur</surname> <given-names>Kaushlendra</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author"><name><surname>Gahukar</surname> <given-names>Santosh J.</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref></contrib>
<contrib contrib-type="author"><name><surname>Chaudhury</surname> <given-names>Ashok</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref></contrib>
<contrib contrib-type="author"><name><surname>Sharma</surname> <given-names>T. R.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author"><name><surname>Singh</surname> <given-names>N. K.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref></contrib>
<contrib contrib-type="author" corresp="yes"><name><surname>Gaikwad</surname> <given-names>Kishor</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/374161/overview"/></contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>ICAR-National Research Centre on Plant Biotechnology</institution> <country>New Delhi, India</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Bio &#x00026; Nanotechnology, Guru Jambheshwar University of Science &#x00026; Technology</institution> <country>Hisar, India</country></aff>
<aff id="aff3"><sup>3</sup><institution>Biotechnology Department, Biotechnology Centre, Dr. Panjabrao Deshmukh Krishi Vidyapeeth</institution> <country>Akola, India</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Soren K. Rasmussen, University of Copenhagen, Denmark</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Ethalinda K. S. Cannon, Iowa State University, USA; Anil Khar, Indian Agricultural Research Institute, India</p></fn>
<fn fn-type="corresp" id="fn001"><p>&#x0002A;Correspondence: Kishor Gaikwad <email>kish2012&#x00040;nrcpb.org</email></p></fn>
<fn fn-type="other" id="fn002"><p>This article was submitted to Crop Science and Horticulture, a section of the journal Frontiers in Plant Science</p></fn></author-notes>
<pub-date pub-type="epub">
<day>09</day>
<month>12</month>
<year>2016</year>
</pub-date>
<pub-date pub-type="collection">
<year>2016</year>
</pub-date>
<volume>7</volume>
<elocation-id>1847</elocation-id>
<history>
<date date-type="received">
<day>05</day>
<month>09</month>
<year>2016</year>
</date>
<date date-type="accepted">
<day>23</day>
<month>11</month>
<year>2016</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2016 Kaila, Chaduvla, Saxena, Bahadur, Gahukar, Chaudhury, Sharma, Singh and Gaikwad.</copyright-statement>
<copyright-year>2016</copyright-year>
<copyright-holder>Kaila, Chaduvla, Saxena, Bahadur, Gahukar, Chaudhury, Sharma, Singh and Gaikwad</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) or licensor are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract><p>Pigeonpea (<italic>Cajanus cajan</italic> (L.) Millspaugh), a diploid (2n &#x0003D; 22) legume crop with a genome size of 852 Mbp, serves as an important source of human dietary protein especially in South East Asian and African regions. In this study, the draft chloroplast genomes of <italic>Cajanus cajan</italic> and <italic>Cajanus scarabaeoides</italic> (L.) Thouars were generated. <italic>Cajanus scarabaeoides</italic> is an important species of the <italic>Cajanus</italic> gene pool and has also been used for developing promising CMS system by different groups. A male sterile genotype harboring the <italic>C. scarabaeoides</italic> cytoplasm was used for sequencing the plastid genome. The cp genome of <italic>C. cajan</italic> is 152,242bp long, having a quadripartite structure with LSC of 83,455 bp and SSC of 17,871 bp separated by IRs of 25,398 bp. Similarly, the cp genome of <italic>C. scarabaeoides</italic> is 152,201bp long, having a quadripartite structure in which IRs of 25,402 bp length separates 83,423 bp of LSC and 17,854 bp of SSC. The pigeonpea cp genome contains 116 unique genes, including 30 tRNA, 4 rRNA, 78 predicted protein coding genes and 5 pseudogenes. A 50 kb inversion was observed in the LSC region of pigeonpea cp genome, consistent with other legumes. Comparison of cp genome with other legumes revealed the contraction of IR boundaries due to the absence of <italic>rps19</italic> gene in the IR region. Chloroplast SSRs were mined and a total of 280 and 292 cpSSRs were identified in <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> respectively. RNA editing was observed at 37 sites in both <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic>, with maximum occurrence in the <italic>ndh</italic> genes. The pigeonpea cp genome sequence would be beneficial in providing informative molecular markers which can be utilized for genetic diversity analysis and aid in understanding the plant systematics studies among major grain legumes.</p></abstract>
<kwd-group>
<kwd><italic>Cajanus cajan</italic></kwd>
<kwd><italic>Cajanus scarabaeoides</italic></kwd>
<kwd>chloroplast genome</kwd>
<kwd>Roche 454 sequencing</kwd>
<kwd>RNA editing</kwd>
</kwd-group>
<counts>
<fig-count count="8"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="100"/>
<page-count count="16"/>
<word-count count="10731"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1"><title>Introduction</title>
<p>Pigeonpea (<italic>Cajanus cajan</italic> (L.) <italic>Millspaugh</italic>) popularly known as arhar, tur and red gram, is an important food legume crop, predominantly cultivated in tropical and subtropical regions of the world. It is a diploid (2n &#x0003D; 22) plant with an estimated genome size of 852 Mbp (Singh et al., <xref ref-type="bibr" rid="B80">2012</xref>) and belongs to subfamily Papilionoideae, and family Leguminosae (Sharma and Green, <xref ref-type="bibr" rid="B77">1980</xref>)</p>
<p>In the recent past, genome sequencing of pigeonpea has been reported (Varshney et al., <xref ref-type="bibr" rid="B87">2011</xref>; Singh et al., <xref ref-type="bibr" rid="B80">2012</xref>) along with the, mitochondrial genome (Tuteja et al., <xref ref-type="bibr" rid="B85">2013</xref>) but chloroplast genome sequencing has not been decoded so far. The first complete chloroplast (cp) genome sequences to be decoded were of tobacco and liverwort in 1986 (Ohyama et al., <xref ref-type="bibr" rid="B53">1986</xref>; Shinozaki et al., <xref ref-type="bibr" rid="B79">1986</xref>). Till date, the chloroplast genome sequences of a number of land plants and algae have been reported. Among the land plants, 888 complete chloroplast genomes have been sequenced till date<xref ref-type="fn" rid="fn0001"><sup>1</sup></xref> and which includes 44 genomes belonging to the Leguminosae family are available including those of for example <italic>Cicer arietinum</italic> (Jansen et al., <xref ref-type="bibr" rid="B32">2008</xref>), <italic>Trifolium subterraneum</italic> (Cai et al., <xref ref-type="bibr" rid="B5">2008</xref>), <italic>Phaseolus vulgaris</italic> (Guo et al., <xref ref-type="bibr" rid="B21">2007</xref>), <italic>Lotus japonica</italic> (Kato et al., <xref ref-type="bibr" rid="B33">2000</xref>), <italic>Glycine max</italic> (Saski et al., <xref ref-type="bibr" rid="B73">2005</xref>), <italic>Medicago truncatula</italic> (Young et al., <xref ref-type="bibr" rid="B100">2011</xref>), and <italic>Vigna radiata</italic> (Tangphatsornruang et al., <xref ref-type="bibr" rid="B82">2010</xref>). Sequencing of complete plastid genomes has been made easy by development of next generation sequencing technologies. The first attempt to use next generation sequencing technology (454 GS 20 system) for the sequencing of chloroplast genome was made by Moore et al. (<xref ref-type="bibr" rid="B49">2006</xref>). As the genetic features of the chloroplast genome are relatively simple, it has contributed to the study of molecular systematics and DNA barcoding (Dong et al., <xref ref-type="bibr" rid="B13">2012</xref>). Uniparental inheritance, low level of recombination and lower substitution rates in comparison to nuclear genome, makes chloroplast genome sequence useful for phylogenetic analysis (Provan et al., <xref ref-type="bibr" rid="B65">2001</xref>) and species identification (Li et al., <xref ref-type="bibr" rid="B39">2015</xref>).</p>
<p>A typical plant chloroplast genome consists of single circular chromosome with a quadripartite structure, which includes two copies of an inverted repeat (IR) spanning 12&#x02013;75 kb that separates the large and small single copy regions, LSC (80&#x02013;90 kb) and SSC (16&#x02013;27 kb). Expansion, contraction or loss of the IR and variation in length of intergenic spacers leads to variation in length of genomes but generally the size of chloroplast genome of photosynthetic organisms ranges between 115 and 165 kb (Palmer, <xref ref-type="bibr" rid="B57">1991</xref>; Raubeson and Jansen, <xref ref-type="bibr" rid="B68">2005</xref>). A typical angiosperm chloroplast contains 110&#x02013;130 genes comprising of 4 rRNA, 30&#x02013;31 tRNA, and 80&#x02013;90 protein coding genes. The IR region comprises of a duplicated set of tRNA and rRNA genes while the single copy regions mostly consists of the genes encoding ribosomal proteins, RNA polymerase subunits, proteins associated with photosystems, as well as protein subunits for NADH dehydrogenase complex. The two IRs are inverted replicas of each other and hence the genes in the IR are present in two copies (Bock, <xref ref-type="bibr" rid="B1">2007</xref>). Increased gene dosage and genome stabilization have been proposed as the reason for the presence of two copies of IR but absence of one copy of IR from some higher plant cp genomes have shown that it is dispensable for the plastome function (Palmer and Thompson, <xref ref-type="bibr" rid="B61">1982</xref>).</p>
<p>Even though chloroplast genome structure seems to be highly conserved among plants, there are some differences in terms of gene synteny and copy number. For instance, gene duplications are reported for few tRNA genes, <italic>ycf2, rpl23</italic>, and <italic>psbA</italic> in some and loss of <italic>accD, psaI, rpl23, rps16, ycf4</italic>, and <italic>infA</italic> in others (Jansen et al., <xref ref-type="bibr" rid="B30">2007</xref>; Magee et al., <xref ref-type="bibr" rid="B43">2010</xref>). It is also reported that ndhF and ycf2 genes were lost repeatedly from a variety of angiosperms during the course of evolution (Shinozaki et al., <xref ref-type="bibr" rid="B79">1986</xref>; Wolfe et al., <xref ref-type="bibr" rid="B93">1992</xref>; Sato et al., <xref ref-type="bibr" rid="B74">1999</xref>). Pseudogenes are also observed in various land plants like <italic>ycf2</italic> which is responsible for cell viability in rice and maize (Hiratsuka et al., <xref ref-type="bibr" rid="B22">1989</xref>; Maier et al., <xref ref-type="bibr" rid="B44">1995</xref>), <italic>infA</italic> gene (translation initiation factor) in tobacco, <italic>Arabidopsis</italic> and <italic>Oenothera elata</italic> and <italic>rpl23</italic> gene in spinach (Thomas et al., <xref ref-type="bibr" rid="B83">1988</xref>). In contrast, cp genomes of the plants belonging to fabaceae family have been reported to undergo extensive rearrangements as compared to other angiosperms (Kato et al., <xref ref-type="bibr" rid="B33">2000</xref>; Guo et al., <xref ref-type="bibr" rid="B21">2007</xref>; Cai et al., <xref ref-type="bibr" rid="B5">2008</xref>; Jansen et al., <xref ref-type="bibr" rid="B32">2008</xref>) Complete loss of the inverted repeat (IR) which occurred rarely during evolution of angiosperm has been reported in pea (Palmer and Thompson, <xref ref-type="bibr" rid="B60">1981</xref>).</p>
<p>The loss of one copy of IR has occurred in a large clade of papilionoid legumes which includes the tribes <italic>Carmichaelieae, Cicereae, Galegeae, Hedysareae, Trifolieae</italic>, and <italic>Fabeae</italic>. The monophyly of IR- lacking clade (IRLC) (Wojciechowski et al., <xref ref-type="bibr" rid="B92">2000</xref>) has been confirmed with the help of phylogenetic analysis by using plastid genes <italic>matK</italic> (Wojciechowski et al., <xref ref-type="bibr" rid="B91">2004</xref>), <italic>rbcl</italic> (Doyle et al., <xref ref-type="bibr" rid="B16">1997</xref>), <italic>trnL</italic> intron (Pennington et al., <xref ref-type="bibr" rid="B62">2001</xref>), and ITS regions of nuclear ribosomal DNA (Hu et al., <xref ref-type="bibr" rid="B25">2002</xref>). The chloroplast genomes sequenced from IRLC includes: <italic>Trifolium aureum; T. repens; T. grandiflorum</italic> and <italic>T. subterraneum</italic> (clover); <italic>C. arietinum</italic> (chickpea); <italic>M. truncatula</italic> (barrel medic); <italic>Pisum sativum</italic> (pea); <italic>Lathyrus sativus</italic> (grass pea); <italic>Lens culinaris</italic> (lentil); <italic>Glycyrrhiza glabra</italic> (licorice); and <italic>Vicia faba</italic> (broad bean) (Saski et al., <xref ref-type="bibr" rid="B73">2005</xref>; Cai et al., <xref ref-type="bibr" rid="B5">2008</xref>; Jansen et al., <xref ref-type="bibr" rid="B32">2008</xref>; Magee et al., <xref ref-type="bibr" rid="B43">2010</xref>; Sabir et al., <xref ref-type="bibr" rid="B72">2014</xref>). Also it is now believed that loss of IR made the chloroplast genome more prone to rearrangements, like a 50 kb inversion reported in mung bean (Palmer and Thompson, <xref ref-type="bibr" rid="B61">1982</xref>), is present in most members of the papilionoideae subfamily which changes the gene order between <italic>trnK</italic> and <italic>accD</italic> genes in the LSC region (Palmer et al., <xref ref-type="bibr" rid="B59">1988</xref>). Another inversion encompassing a 78 kb region in LSC was first reported in <italic>Phaseolus</italic> and <italic>Vigna</italic>, a member of subtribe phaseolinae and tribe phaseoleae (Bruneau et al., <xref ref-type="bibr" rid="B2">1990</xref>; Guo et al., <xref ref-type="bibr" rid="B21">2007</xref>; Tangphatsornruang et al., <xref ref-type="bibr" rid="B82">2010</xref>) and a newly reported 36 kb inversion within the 50 kb inversion present in lupines and other genisotoids (Martin et al., <xref ref-type="bibr" rid="B47">2014</xref>). There seems to be variation in the legumes for the presence of certain genes. Genes <italic>infA</italic> and <italic>rpl22</italic> are not encoded by legume chloroplasts (Doyle et al., <xref ref-type="bibr" rid="B17">1995</xref>), rather it is reported that their nuclear copies are being directed toward the chloroplast (Gantt et al., <xref ref-type="bibr" rid="B20">1991</xref>; Millen et al., <xref ref-type="bibr" rid="B48">2001</xref>). The <italic>accD</italic> gene is also reported to be functionally transferred to the nucleus in <italic>Trifolium</italic> species (Magee et al., <xref ref-type="bibr" rid="B43">2010</xref>). The loss of intron in the <italic>clpP</italic> and <italic>rps12</italic> genes has also been mapped to Leguminosae phylogeny (Doyle et al., <xref ref-type="bibr" rid="B17">1995</xref>; Jansen et al., <xref ref-type="bibr" rid="B32">2008</xref>).</p>
<p>Microsatellites or Simple sequence repeats (SSRs) are short DNA sequence stretches in which a motif of one to six bases is tandemly repeated (Schl&#x000F6;tterer, <xref ref-type="bibr" rid="B75">2000</xref>). Powell et al. (<xref ref-type="bibr" rid="B64">1995</xref>) reported likewise nuclear SSRs, chloroplast microsatellites also demonstrate significant polymorphism. Chloroplast SSRs demonstrate high level of intraspecific variation and thus are considered as potential markers in evolutionary, population and systematics studies in plants (Provan et al., <xref ref-type="bibr" rid="B65">2001</xref>).</p>
<p>Of late, cp genome sequencing has acquired new dimensions. Recent methods like amplification of entire genome using rolling circle amplification (Dhingra and Folta, <xref ref-type="bibr" rid="B12">2005</xref>), high throughput sequencing (Moore et al., <xref ref-type="bibr" rid="B49">2006</xref>; Cronn et al., <xref ref-type="bibr" rid="B9">2008</xref>; Yan et al., <xref ref-type="bibr" rid="B96">2015</xref>) have been successful in achieving fast and cost effective chloroplast genome sequencing. Pigeonpea genomics is gathering speed and that requires availability of all types of genomics resources. The sequence of plastid genomes of pigeonpea will aid in effective utilization for genotyping. Here we report the use of Roche 454 FLX sequencing technology for obtaining draft chloroplast genome sequence of <italic>Cajanus cajan</italic> and <italic>Cajanus scarabaeoides</italic> for understanding the genome organization, editing changes and mining of SSR markers.</p>
</sec>
<sec sec-type="materials and methods" id="s2"><title>Materials and methods</title>
<sec><title>Plant material and DNA isolation</title>
<p>Cytoplasmic male sterile pigeonpea AKPA1 (<italic>C. scarabaeoides</italic> cytoplasm) and its fertility restorer AKPR375 (<italic>C. cajan</italic> cytoplasm) were used in this study. Fresh leaves were harvested from seedlings and were kept in the dark for 48 h prior to chloroplast DNA isolation. Chloroplast DNA isolation was performed as per Kirti et al. (<xref ref-type="bibr" rid="B35">1993</xref>).</p>
</sec>
<sec><title>Chloroplast genome sequencing, assembly and annotation</title>
<p>The plastid DNA (1 &#x003BC;g) was sheared by nebulization and purified to obtain the desired size range. Library preparation and sequencing by Roche 454 GS FLX platform was carried out as per manufacturer&#x00027;s instructions. Two biological replicates were later pooled for data analysis.</p>
<p>Pyrosequencing was performed on a Genome Sequencer FLX system using Titanium Chemistry (Roche, 454). The per base quality of the raw reads (496,972, 498,603) was assessed by FastQC V0.11.4<xref ref-type="fn" rid="fn0002"><sup>2</sup></xref>. Quality filtering was done using PRINSEQ lite V0.20.4 (Schmieder and Edwards, <xref ref-type="bibr" rid="B76">2011</xref>; phred Q &#x02265; 20, Length &#x02265; 50). Quality filtered reads were <italic>denovo</italic> assembled using Newbler (GS <italic>de novo</italic> Assembler) v2.6 programme with default parameters.</p>
<p>Contigs larger than 200 bp were extracted to construct consensus using <italic>G. max</italic> chloroplast genome. Contigs were aligned to <italic>G. max</italic> cp genome sequence by BLASTN (<ext-link ext-link-type="uri" xlink:href="https://www.nih.gov/">https://www.nih.gov/</ext-link>). Contigs with &#x0003E;80% matches were ordered against the reference. Gap between adjacent contigs was initially filled with &#x0201C;N&#x0201D; to construct consensus cp genome. The gaps in the genome were filled by alignment of filtered reads using CLC Genomics Workbench 7.5.1 (CLC Bio, Arhus, Denmark) with following parameters: Length fraction &#x0003D; 0.5, Similarity &#x0003D; 0.9 to the end and gap filling extended read-contig regions were merged where 10 bp or more bp overlapping till a single large fragment was obtained.</p>
<p>Genome annotation was carried out with DOGMA (Dual Organellar Genome Annotator; Wyman et al., <xref ref-type="bibr" rid="B94">2004</xref>) to identify coding sequences (cds), rRNAs, and tRNAs using the plastid genetic code and BLAST homology searches. To verify the exact gene and exon boundaries, we compared Pigeonpea annotations with those of <italic>G. max</italic> and manually corrected the start and stop codons. The presence of tRNA genes were also confirmed by online tRNAscan-SE 1.21 search serve (Lowe and Eddy, <xref ref-type="bibr" rid="B41">1997</xref>).</p>
<p>The entire cp sequences of <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> genotypes, along with gene annotations were submitted to GenBank (accession number: <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="KU729878">KU729878</ext-link> for <italic>C. scarabaeoides</italic> and KU729879 for <italic>C. cajan</italic>).</p>
</sec>
<sec><title>PCR amplification</title>
<p>To confirm the junctions between LSC and IR; SSC and IR, PCR amplification was carried out in a total reaction volume of 20 &#x003BC;l containing 30 ng of DNA template, 1 &#x000D7; buffer, 0.2 mM dNTPs, 2.5 mM MgCl<sub>2</sub>, 1U DNA Polymerase and 0.5 &#x003BC;M each of forward and reverse primers. Primer pair&#x02014;(i) LI_F1: TCCCTCGACACCAGAAGATA, LI_R1: CCGGATCTAAATGTTGGCTA, (ii) LI2_F2: GTCGGACAAGTGGGAAATGT, LI2_R2: CCGAGCTAACCTTGGTATGG were used to amplify the junction between LSC and IR. And the primer pair&#x02014;(i) SI_F1: GTTGGTTTAAATAGCCCCG; SI_R1:CCATCTGTTAACCATTTTTGGGG, (ii) SI_F2:TGTGATTATTGCCGAAGAACTG,SI_R2:CGTTCTCAACCCATGACCAA were used to amplify the junction between SSC and IR. Amplification was performed in Techne PCR: 94&#x000B0;C for 3 min followed by 40 cycles of 94&#x000B0;C for 30 s, 52&#x000B0;C for 30 s, 72&#x000B0;C for 1 min and a final extension step at 72&#x000B0;C for 10 min. Amplified products were separated on a 1.2% agarose gel.</p>
</sec>
<sec><title>Genome analysis</title>
<p>Full alignments of legume cp genomes were performed using mVISTA program (Frazer et al., <xref ref-type="bibr" rid="B18">2004</xref>) in Shuffle-LAGAN mode. Selected legume cp genomes were retrieved from NCBI: <italic>G</italic>. <italic>max</italic> (NC_7942), <italic>P. vulgaris</italic> (NC_9259), <italic>Cicer areitinum</italic> (NC_11163), <italic>V. radiata</italic> (NC_13843) and used as a reference.</p>
<p>The comparison of gene order between the chloroplast genomes of <italic>C. cajan, C. scarabaeoides, Arabidopsis thaliana</italic> (NC_000932), <italic>G. max</italic> (NC_7942), <italic>P. vulgaris</italic> (NC_9259), <italic>C. areitinum</italic> (NC_11163), <italic>V. radiata</italic> (NC_13843), and <italic>M. truncatula</italic> (NC_003119) was performed with MAUVE (Darling et al., <xref ref-type="bibr" rid="B11">2004</xref>). Codon usage was calculated for all exons of protein-coding genes with CodonW 1.4.4. Base composition was calculated by DNA/RNA base composition calculator<xref ref-type="fn" rid="fn0003"><sup>3</sup></xref>.</p>
</sec>
<sec><title>RNA editing analysis</title>
<p>Predictive RNA Editor for Plants (PREP) suite<xref ref-type="fn" rid="fn0004"><sup>4</sup></xref> was used to predict RNA editing sites (Mower, <xref ref-type="bibr" rid="B51">2009</xref>). For the analysis, the cut-off value was set at 0.8. The PREP-cp program consists of 35 reference genes for predicting RNA editing sites in the chloroplast genomes. The editing sites were validated by mapping the transcriptome data (unpublished data) onto the DNA sequences from the chloroplast in CLC Genomics Workbench 7.5.1 (CLC Bio, Arhus, Denmark). The sites having more than 5X coverage (C&#x02013;U) were considered as true editing changes.</p>
</sec>
<sec><title>SSR analysis</title>
<p>Chloroplast microsatellites (cpSSRs) were identified in high quality sequence of <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> by using MISA<xref ref-type="fn" rid="fn0005"><sup>5</sup></xref> perl script. The identified cpSSRs included mononucleotide repeats &#x02265; 8 bases, dinucleotides &#x02265; 10 bases (five repeats) and trinucleotides and tetranucleotides &#x02265; 12 bases (four and three repeats respectively), pentanucleotide &#x02265; 15 bases (3 repeats) and hexanucleotides &#x02265; 18 bases (3 repeats).</p>
</sec>
</sec>
<sec id="s3"><title>Results and discussion</title>
<sec><title>Chloroplast genome assembly</title>
<p>Roche-454 Sequencing of <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> chloroplast genomes from purified DNA generated about 496,972 and 498,603 reads respectively. Filtered reads (496,228 and 497,800) were used for <italic>de novo</italic> assembly using Newbler (v.2.6 454 Life Science). A total of 13,732 (N50, 900 bp) and 13,002 (N50, 889 bp) contigs from <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> were respectively obtained with size ranging from 200 to 79,709 bases. They were then organized by using <italic>G. max</italic> chloroplast as reference. The contigs with &#x0003E;80% matches were used to build a draft consensus. Finally, to fill gaps in the consensus, filtered reads were aligned to draft consensus and the sequence of the read-contig in the direction of the gap were compared. If there was an overlap of 10 bp or more, the two contigs were joined together. Using this strategy, we achieved a minimum coverage of 99.96% of the cp genome for the <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> chloroplast genome. The size of cp genomes of <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> was found to be 152,201 bp and 152,242 bp. Finally, the four junctions between IRs and LSC/SSC were confirmed and validated by PCR amplification.</p>
</sec>
<sec><title>Genome content and organization of the pigeonpea plastid genome</title>
<p>The cp genomes of <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> are 152,201 bp and 152,242 bp in length respectively. It consists of a quadripartite structure with IRs of 25,402 bp separating 83,423 bp of LSC and 17,854 bp of SSC in <italic>C. scarabaeoides</italic>, while 25,398 bp of IR separates 83,455 bp of LSC and 17,871 bp of SSC in <italic>C. cajan</italic> (Figures <xref ref-type="fig" rid="F1">1</xref>, <xref ref-type="fig" rid="F2">2</xref>). The cp genome of <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> differs slightly from <italic>G. max</italic> (152,218 bp) and other legumes (<italic>V. radiata</italic>-151,271 bp; <italic>P. vulgaris</italic>-150,285 bp; <italic>C. arietinum</italic>-125,319 bp) in terms of size, (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>).</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p><bold>Map of <italic>C. scarabaeoides</italic> plastid genome</bold>. Genes shown on the outside of the map are transcribed clockwise while the genes that are shown on the inside are transcribed counterclockwise. The innermost darker gray corresponds to GC content, whereas the lighter gray corresponds to AT content. Different genes are color coded. IR, inverted repeat; LSC, large single copy region; SSC, small single copy region. Pseudogenes are marked with &#x0201C;<sup>&#x0002A;</sup>.&#x0201D;</p></caption>
<graphic xlink:href="fpls-07-01847-g0001.tif"/>
</fig>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p><bold>Map of <italic>C. cajan</italic> plastid genome</bold>. Genes shown on the outside of the map are transcribed clockwise while the genes that are shown on the inside are transcribed counterclockwise. The innermost darker gray corresponds to GC content, whereas the lighter gray corresponds to AT content. Different genes are color coded. IR, inverted repeat; LSC, large single copy region; SSC, small single copy region. Pseudogenes are marked with &#x0201C;<sup>&#x0002A;</sup>.&#x0201D;</p></caption>
<graphic xlink:href="fpls-07-01847-g0002.tif"/>
</fig>
<p>Both plastid genomes contain 116 unique genes, which include 30 tRNA, 4 rRNA, 78 predicted protein coding genes and 5 peudogenes. The LSC region consists of 58 protein coding genes and SSC region consists of 13 protein coding genes in both genotypes. The tRNA coding genes represents 20 amino acids in both genotypes and are distributed throughout the genome, with one tRNA coding gene present in the SSC region, 22 in the LSC region and 7 in the IR region of both. For the 61 possible codons (excluding stop codon), 28 tRNAs exist in the cp genome of both genotypes. The <italic>trnT-GGU</italic> and <italic>trnM-CAU</italic> genes are duplicated in the LSC region of both cp genomes. Similar tRNA genes duplications have also been reported in the cp genome of <italic>Actinidia</italic>, black pine and green algae (Tsudzuki et al., <xref ref-type="bibr" rid="B84">1994</xref>; Wakasugi et al., <xref ref-type="bibr" rid="B88">1997</xref>; Yao et al., <xref ref-type="bibr" rid="B98">2015</xref>). The IR region consists of 7 tRNA coding genes, 4 rRNA coding genes, 8 protein coding genes (<italic>rpl2, rpl23, ycf2, ndhB, rps7, rps12, orf42</italic>, and <italic>orf56</italic>) and 2 pseudogenes (<italic>ycf15</italic> and <italic>ycf68</italic>) in both <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> (Table <xref ref-type="table" rid="T1">1</xref>), thus these genes seem to be generally duplicated in the IR regions. Therefore, in total 138 genes are present in the cp genome of pigeonpea (Figures <xref ref-type="fig" rid="F1">1</xref>, <xref ref-type="fig" rid="F2">2</xref>). Trans-splicing is observed in <italic>rps12</italic> gene with 5&#x02032; end exon present in the LSC region and the 3&#x02032; end exon duplicated and present in the IR region.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p><bold>List of genes present in the cp genome of <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic></bold>.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Category</bold></th>
<th valign="top" align="left"><bold>Gene Name</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Photosystem I</td>
<td valign="top" align="left"><italic>psaA,B,C,I,J,Ycf3<xref ref-type="table-fn" rid="TN1"><sup>a</sup></xref>,ycf4</italic></td>
</tr>
<tr>
<td valign="top" align="left">Photosystem II</td>
<td valign="top" align="left"><italic>psbA,B,C,D,E,F,H,I,J,K,L,M,N,T,Z/lhbA</italic></td>
</tr>
<tr>
<td valign="top" align="left">Cytochrome b6/f</td>
<td valign="top" align="left"><italic>petA,B,D,G,L,N</italic></td>
</tr>
<tr>
<td valign="top" align="left">ATP Synthase</td>
<td valign="top" align="left"><italic>atpA,B,E,F<xref ref-type="table-fn" rid="TN2"><sup>b</sup></xref>,H,I</italic></td>
</tr>
<tr>
<td valign="top" align="left">Rubisco</td>
<td valign="top" align="left"><italic>rbcL</italic></td>
</tr>
<tr>
<td valign="top" align="left">NADH Oxidoreductase</td>
<td valign="top" align="left"><italic>ndhA,B<xref ref-type="table-fn" rid="TN2"><sup>b</sup></xref><sup>,</sup><xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>,C,D,E,F,G,H,I,J,K</italic></td>
</tr>
<tr>
<td valign="top" align="left">Large subunit ribosomal proteins</td>
<td valign="top" align="left"><italic>rpl2<xref ref-type="table-fn" rid="TN2"><sup>b</sup></xref><sup>,</sup><xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>,14,16,20,23<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>,32,33<xref ref-type="table-fn" rid="TN5"><sup>e</sup></xref>,36</italic></td>
</tr>
<tr>
<td valign="top" align="left">Small subunit ribosomal proteins</td>
<td valign="top" align="left"><italic>rps2,3,4,7<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>,8,11,12<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref><sup>,</sup><xref ref-type="table-fn" rid="TN4"><sup>d</sup></xref>,14,15,16<xref ref-type="table-fn" rid="TN5"><sup>e</sup></xref>,18,19</italic></td>
</tr>
<tr>
<td valign="top" align="left">RNAP</td>
<td valign="top" align="left"><italic>rpoA,rpoB,C1<xref ref-type="table-fn" rid="TN2"><sup>b</sup></xref>,C2</italic>,</td>
</tr>
<tr>
<td valign="top" align="left">Other Proteins</td>
<td valign="top" align="left"><italic>accD, ccsA,matK,cemA,clpP<xref ref-type="table-fn" rid="TN1"><sup>a</sup></xref></italic>,</td>
</tr>
<tr>
<td valign="top" align="left">Proteins of unknown Function</td>
<td valign="top" align="left"><italic>ycf1<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref><sup>,</sup><xref ref-type="table-fn" rid="TN4"><sup>e</sup></xref>,ycf2<xref ref-type="table-fn" rid="TN2"><sup>b</sup></xref><sup>,</sup><xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>, ycf15<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref><sup>,</sup><xref ref-type="table-fn" rid="TN4"><sup>e</sup></xref>,ycf68<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref><sup>,</sup><xref ref-type="table-fn" rid="TN4"><sup>e</sup></xref>,orf42<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>,orf56<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>,orf188</italic></td>
</tr>
<tr>
<td valign="top" align="left">Ribosomal RNAs</td>
<td valign="top" align="left"><italic>rrn23<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>,16<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>,5<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>,4.5<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref></italic></td>
</tr>
<tr>
<td valign="top" align="left">Transfer RNAs</td>
<td valign="top" align="left"><italic>trnH(GUG), K(UUU)<xref ref-type="table-fn" rid="TN2"><sup>b</sup></xref>,M(CAU),T(GGU),V(UAC)<xref ref-type="table-fn" rid="TN2"><sup>b</sup></xref>,F(GAA),L(UAA)<xref ref-type="table-fn" rid="TN2"><sup>b</sup></xref>,T(UGU),S(GGA),fM(CAU), G(UCC),S(UGA),E(UUC),Y(GUA),D(GUC),C(GCA),R(UCU),S(GCU),Q(UUG), W(CCA), P(UGG), P(GGG), I(CAU)<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>, L(CAA)<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>, V(GAC)<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>, I(GAU)<xref ref-type="table-fn" rid="TN2"><sup>b</sup></xref><sup>,</sup><xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>, A(UGC)<xref ref-type="table-fn" rid="TN2"><sup>b</sup></xref><sup>,</sup><xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>, R(ACG)<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>, N(GUU)<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref>,L(UAG)</italic></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="TN1">
<label>a</label>
<p><italic>Gene containing two introns</italic>.</p></fn>
<fn id="TN2">
<label>b</label>
<p><italic>Gene containing a single intron</italic>.</p></fn>
<fn id="TN3">
<label>c</label>
<p><italic>Two gene copies in the IRs</italic>.</p></fn>
<fn id="TN4">
<label>d</label>
<p><italic>Gene divided into two independent transcription units</italic>.</p></fn>
<fn id="TN5">
<label>e</label>
<p><italic>Pseudogenes</italic>.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>The average AT content of the cp genome is 66% for both genotypes (Table <xref ref-type="table" rid="T2">2</xref>), which is found to be in similar range, reported for the legumes including <italic>G. max</italic> (64.63%) and <italic>C. arietinum</italic> (66.1%). Individually the AT content of the LSC and SSC regions is 68% and 72% in both <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic>. The AT content of IR region is 58% in both and is consistent with findings for other cp genomes. The low AT content of the IR region may be due to the reduced presence of AT nucleotides in the four rRNA genes (<italic>rrn16, rrn23, rrn5</italic>, and <italic>rrn4.5</italic>) present in IR region. The increased sequence complexity of the IR regions may help in the stabilization of the genome as it has been reported in the past that the legume plastids which have lost one copy of IR are more prone to rearrangements as compared to those genomes which have retained the IR copy (Palmer and Thompson, <xref ref-type="bibr" rid="B61">1982</xref>).</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p><bold>Features of the chloroplast genome of <italic>C. scarabaeoides</italic> (Cs) and <italic>C. cajan</italic> (Cc)</bold>.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th/>
<th valign="top" align="center" colspan="2" style="border-bottom: thin solid #000000;"><bold>T/U%</bold></th>
<th valign="top" align="center" colspan="2" style="border-bottom: thin solid #000000;"><bold>C%</bold></th>
<th valign="top" align="center" colspan="2" style="border-bottom: thin solid #000000;"><bold>A%</bold></th>
<th valign="top" align="center" colspan="2" style="border-bottom: thin solid #000000;"><bold>G%</bold></th>
<th valign="top" align="center" colspan="2" style="border-bottom: thin solid #000000;"><bold>Length (bp)</bold></th>
<th valign="top" align="center" colspan="2" style="border-bottom: thin solid #000000;"><bold>AT%</bold></th>
</tr>
<tr>
<th/>
<th valign="top" align="center"><bold>Cs</bold></th>
<th valign="top" align="center"><bold>Cc</bold></th>
<th valign="top" align="center"><bold>Cs</bold></th>
<th valign="top" align="center"><bold>Cc</bold></th>
<th valign="top" align="center"><bold>Cs</bold></th>
<th valign="top" align="center"><bold>Cc</bold></th>
<th valign="top" align="center"><bold>Cs</bold></th>
<th valign="top" align="center"><bold>Cc</bold></th>
<th valign="top" align="center"><bold>Cs</bold></th>
<th valign="top" align="center"><bold>Cc</bold></th>
<th valign="top" align="center"><bold>Cs</bold></th>
<th valign="top" align="center"><bold>Cc</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Genome</td>
<td valign="top" align="center">33</td>
<td valign="top" align="center">33</td>
<td valign="top" align="center">17</td>
<td valign="top" align="center">17</td>
<td valign="top" align="center">33</td>
<td valign="top" align="center">33</td>
<td valign="top" align="center">18</td>
<td valign="top" align="center">18</td>
<td valign="top" align="center">152,201</td>
<td valign="top" align="center">152,242</td>
<td valign="top" align="center">66</td>
<td valign="top" align="center">66</td>
</tr>
<tr>
<td valign="top" align="left">LSC</td>
<td valign="top" align="center">34</td>
<td valign="top" align="center">34</td>
<td valign="top" align="center">16</td>
<td valign="top" align="center">16</td>
<td valign="top" align="center">34</td>
<td valign="top" align="center">34</td>
<td valign="top" align="center">17</td>
<td valign="top" align="center">17</td>
<td valign="top" align="center">83,423</td>
<td valign="top" align="center">83,455</td>
<td valign="top" align="center">68</td>
<td valign="top" align="center">68</td>
</tr>
<tr>
<td valign="top" align="left">SSC</td>
<td valign="top" align="center">36</td>
<td valign="top" align="center">36</td>
<td valign="top" align="center">13</td>
<td valign="top" align="center">13</td>
<td valign="top" align="center">36</td>
<td valign="top" align="center">36</td>
<td valign="top" align="center">15</td>
<td valign="top" align="center">15</td>
<td valign="top" align="center">17,854</td>
<td valign="top" align="center">17,871</td>
<td valign="top" align="center">72</td>
<td valign="top" align="center">72</td>
</tr>
<tr>
<td valign="top" align="left">IR</td>
<td valign="top" align="center">29</td>
<td valign="top" align="center">29</td>
<td valign="top" align="center">20</td>
<td valign="top" align="center">20</td>
<td valign="top" align="center">29</td>
<td valign="top" align="center">29</td>
<td valign="top" align="center">22</td>
<td valign="top" align="center">22</td>
<td valign="top" align="center">25,402</td>
<td valign="top" align="center">25,398</td>
<td valign="top" align="center">58</td>
<td valign="top" align="center">58</td>
</tr>
<tr>
<td valign="top" align="left">Prt.Coding genes</td>
<td valign="top" align="center">32</td>
<td valign="top" align="center">32</td>
<td valign="top" align="center">17</td>
<td valign="top" align="center">17</td>
<td valign="top" align="center">31</td>
<td valign="top" align="center">31</td>
<td valign="top" align="center">19</td>
<td valign="top" align="center">19</td>
<td valign="top" align="center">79,052</td>
<td valign="top" align="center">75,031</td>
<td valign="top" align="center">63</td>
<td valign="top" align="center">63</td>
</tr>
<tr>
<td valign="top" align="left">tRNA</td>
<td valign="top" align="center">26</td>
<td valign="top" align="center">25</td>
<td valign="top" align="center">23</td>
<td valign="top" align="center">23</td>
<td valign="top" align="center">23</td>
<td valign="top" align="center">23</td>
<td valign="top" align="center">28</td>
<td valign="top" align="center">29</td>
<td valign="top" align="center">2888</td>
<td valign="top" align="center">2888</td>
<td valign="top" align="center">48</td>
<td valign="top" align="center">48</td>
</tr>
<tr>
<td valign="top" align="left">rRNA</td>
<td valign="top" align="center">19</td>
<td valign="top" align="center">19</td>
<td valign="top" align="center">23</td>
<td valign="top" align="center">23</td>
<td valign="top" align="center">26</td>
<td valign="top" align="center">26</td>
<td valign="top" align="center">32</td>
<td valign="top" align="center">32</td>
<td valign="top" align="center">9054</td>
<td valign="top" align="center">9054</td>
<td valign="top" align="center">45</td>
<td valign="top" align="center">45</td>
</tr>
<tr>
<td valign="top" align="left">First position</td>
<td valign="top" align="center">32.1</td>
<td valign="top" align="center">32.1</td>
<td valign="top" align="center">17.5</td>
<td valign="top" align="center">17.5</td>
<td valign="top" align="center">31.8</td>
<td valign="top" align="center">31.8</td>
<td valign="top" align="center">18.3</td>
<td valign="top" align="center">18.3</td>
<td valign="top" align="center">50,747</td>
<td valign="top" align="center">50,747</td>
<td valign="top" align="center">64</td>
<td valign="top" align="center">64</td>
</tr>
<tr>
<td valign="top" align="left">Second position</td>
<td valign="top" align="center">33.02</td>
<td valign="top" align="center">33.02</td>
<td valign="top" align="center">17.23</td>
<td valign="top" align="center">17.23</td>
<td valign="top" align="center">32.77</td>
<td valign="top" align="center">32.77</td>
<td valign="top" align="center">16.96</td>
<td valign="top" align="center">16.96</td>
<td valign="top" align="center">50,747</td>
<td valign="top" align="center">50,747</td>
<td valign="top" align="center">65.79</td>
<td valign="top" align="center">65.79</td>
</tr>
<tr>
<td valign="top" align="left">Third position</td>
<td valign="top" align="center">32.3</td>
<td valign="top" align="center">32.3</td>
<td valign="top" align="center">16.6</td>
<td valign="top" align="center">16.6</td>
<td valign="top" align="center">32.9</td>
<td valign="top" align="center">32.9</td>
<td valign="top" align="center">18.1</td>
<td valign="top" align="center">18.1</td>
<td valign="top" align="center">50,747</td>
<td valign="top" align="center">50,747</td>
<td valign="top" align="center">64.5</td>
<td valign="top" align="center">64.5</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Protein coding regions account for 49.2% of the whole genome while tRNA and rRNA accounts for 1.9% and 5.9% respectively in <italic>C. cajan</italic>, whereas in <italic>C. scarabaeoides</italic>, protein coding region accounts for 51.9% while 1.9% and 5.9% are accounted by tRNA and rRNA regions respectively. The remaining region consists of non-coding sequences which include intergenic regions, introns and pseudogenes.</p>
<p>In the cp genome of <italic>C. scarabaeoides</italic>, a total of 79,052 nt and 26,350 codons represent the coding capacity of 78 protein coding genes. Among these, leucine (2898 codons, 10.99% of the total) represents the most abundant amino acid whereas cysteine (354 codons, 1.34% of the total) represents the least abundant amino acid. Similarly, in the <italic>C. cajan</italic>, 78 protein coding genes are represented by 75,031 nt and 25,010 codons. Here too leucine (2264 codons, 9.05%) is the most abundant amino acid and cysteine (416 codons, 1.66%) is the least abundant amino acid (Supplementary Tables <xref ref-type="supplementary-material" rid="SM2">S2</xref>, <xref ref-type="supplementary-material" rid="SM3">S3</xref>). Leucine and cysteine are reported as the most and least abundant amino acids respectively in other cp genomes also (Chen et al., <xref ref-type="bibr" rid="B6">2015</xref>; Curci et al., <xref ref-type="bibr" rid="B10">2015</xref>; Redwan et al., <xref ref-type="bibr" rid="B70">2015</xref>). It has been suggested in previous studies that there is a significant relationship between codon usage bias and gene expression level (Iannacone et al., <xref ref-type="bibr" rid="B28">1997</xref>; Rouwendal et al., <xref ref-type="bibr" rid="B71">1997</xref>), therefore it implies that there is a strong natural selection pressure on highly expressed genes to optimize their translation efficiency by using major codons (Bulmer, <xref ref-type="bibr" rid="B3">1988</xref>). The codon usage is biased toward the high representation of A and T at the third codon position (Table <xref ref-type="table" rid="T2">2</xref>). The biasness for A and T nucleotide at third codon position is also shown by RSCU analysis for instance, for valine the codon ending with A and T are 36.5% whereas those ending with G and C are 14.75 and 12.25% respectively. Such biasness for high representation of A and T at third codon position is also observed in other land plant plastid genomes (Yang et al., <xref ref-type="bibr" rid="B97">2014</xref>; Yao et al., <xref ref-type="bibr" rid="B98">2015</xref>). It may be due to the compositional bias toward AT rich content (Morton, <xref ref-type="bibr" rid="B50">2003</xref>; Williams et al., <xref ref-type="bibr" rid="B90">2015</xref>). As all cp genomes have high AT content, AT biased mutational pressure and its prokaryotic origins are believed to be the factors responsible for codon usage bias.</p>
<p>There are 12 intron containing genes in both the genotypes. Among these, 10 genes (5 protein coding genes and 5 tRNA genes) have a single intron and 2 genes (<italic>ycf3</italic> and <italic>clpP</italic>) have two introns each. <italic>Cicer, Medicago, Trifolium, P. sativum</italic>, and <italic>L. sativus</italic> has lost the <italic>clpP</italic> introns and this loss provides support for the monophyly of IRLC (Jansen et al., <xref ref-type="bibr" rid="B32">2008</xref>). On the other hand, <italic>Acacia liguata</italic>, a member of Mimosoideae subfamily of legumes retains both the introns of clpP. The intron containing genes are distributed throughout the genome with 7 genes present in the LSC region and 5 genes present in IR region of both the genotypes (Supplementary Tables <xref ref-type="supplementary-material" rid="SM4">S4</xref>, <xref ref-type="supplementary-material" rid="SM5">S5</xref>). Among the intron containing genes, <italic>trnK-UUU</italic> has the largest intron in both the plastids (2593 bp in <italic>C. scarabaeoides</italic> and 2594 bp in <italic>C. cajan</italic>) and likewise this intron also contains <italic>matK</italic> gene, which is consistent with other legume plastid genomes (Saski et al., <xref ref-type="bibr" rid="B73">2005</xref>; Tangphatsornruang et al., <xref ref-type="bibr" rid="B82">2010</xref>). Koch et al. (<xref ref-type="bibr" rid="B36">1981</xref>) demonstrated for first time the presence of intron in cp <italic>trna</italic> genes, <italic>trnI</italic>, and <italic>trnA</italic>. Some recent studies have suggested that, introns play an important role in the regulation of gene expression and therefore improve exogenous gene expression, resulting in the enhanced plastome efficiency (Xu et al., <xref ref-type="bibr" rid="B95">2003</xref>).</p>
<p>It was observed that <italic>rpl22</italic> and <italic>infA</italic> genes are absent from the plastid genome of both genotypes. The absence of <italic>rpl22</italic> gene is also observed in <italic>G. max</italic> (Saski et al., <xref ref-type="bibr" rid="B73">2005</xref>), <italic>T. subterraneum</italic> (Cai et al., <xref ref-type="bibr" rid="B5">2008</xref>), and <italic>Lotus japonicus</italic> (Kato et al., <xref ref-type="bibr" rid="B33">2000</xref>). Molecular analysis suggested the transfer of <italic>rpl22</italic> gene to nucleus from the cp genome, as a functional copy of this gene has been found from the nuclear genome of <italic>P. sativum</italic> (Gantt et al., <xref ref-type="bibr" rid="B20">1991</xref>). Also a functional copy of <italic>rpl22</italic> gene was verified in the nucleus of lupine species (Martin et al., <xref ref-type="bibr" rid="B47">2014</xref>). The gene <italic>infA</italic> has been lost from cp genome to nucleus in the course of angiosperm evolution in almost all rosids (Millen et al., <xref ref-type="bibr" rid="B48">2001</xref>). A pseudogene <italic>rps16</italic> is present in the plastid genome of both <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic>, whereas it has been lost from the genome of <italic>C. arietinum</italic> (Jansen et al., <xref ref-type="bibr" rid="B32">2008</xref>), <italic>M. truncatula</italic> (Young et al., <xref ref-type="bibr" rid="B100">2011</xref>) and is present as a non-functional copy in <italic>V. radiata</italic> (Tangphatsornruang et al., <xref ref-type="bibr" rid="B82">2010</xref>). The loss of <italic>rps16</italic> has occurred multiple times from the legumes (Doyle et al., <xref ref-type="bibr" rid="B17">1995</xref>). Gene substitution has been identified as the mechanism for loss of <italic>rps16</italic> gene from cp genomes of <italic>Populus</italic> and <italic>Medicago</italic> (Ueda et al., <xref ref-type="bibr" rid="B86">2008</xref>). The dual targeting of mt. ribosomal protein S16 (encoded by nuclear gene) to mitochondria as well as to chloroplast compensates for the loss of cp <italic>rps16</italic> gene. Another gene, <italic>rpl33</italic> observed to be present in <italic>C. scarabaeoides, C. cajan, Vigna</italic>, and <italic>Phaseolus</italic> (Guo et al., <xref ref-type="bibr" rid="B21">2007</xref>) is also a pseudogene as it contains a premature stop codon within the coding region.</p>
<p>Among the five completely sequenced legume plastid genomes, three genomes (<italic>Cicer, Glycine</italic>, and <italic>Medicago</italic>) lack the <italic>ycf4 gene</italic> whereas it is present in both <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic>. Magee et al. (<xref ref-type="bibr" rid="B43">2010</xref>) identified a 1.5 kb long region having dramatically high rate of evolution coinciding with <italic>ycf4</italic> gene. It has been found that <italic>ycf4</italic> has evolved much faster in most legumes than in other angiosperms. It is reported to be lost from the cp genome of <italic>Lathyrus odoratus</italic> (Magee et al., <xref ref-type="bibr" rid="B43">2010</xref>) and either absent or present as a pseudogene in <italic>P. sativum</italic> (Nagano et al., <xref ref-type="bibr" rid="B52">1991</xref>; Smith et al., <xref ref-type="bibr" rid="B81">1991</xref>). It has been established by slot-blot hybridization experiments that ycf4 may have been lost independently multiple times in different lineages of legumes (Doyle et al., <xref ref-type="bibr" rid="B17">1995</xref>). Magee et al. (<xref ref-type="bibr" rid="B43">2010</xref>) also reported a very interesting finding that ycf4 gene which was reported absent from the cp genome of <italic>G. max, T. subterraneum, Cicer arientinum</italic> and <italic>M. truncatula</italic> was present in all the cp genomes but as the gene is so divergent, DOGMA (Wyman et al., <xref ref-type="bibr" rid="B94">2004</xref>) was not able to annotate them.</p>
<p>The two pseudogenes <italic>ycf15</italic> and <italic>ycf68</italic> present in <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic>, seem to contain premature stop codons, similar to that observed in <italic>V. radiata</italic> and <italic>P. vulgaris.</italic> In Artichoke, <italic>ycf68</italic> is reported to be a pseudogene (Curci et al., <xref ref-type="bibr" rid="B10">2015</xref>), while both <italic>ycf15</italic> and 68 are reported as pseudogenes in sweet potato (Yan et al., <xref ref-type="bibr" rid="B96">2015</xref>). The <italic>accD</italic> gene which was reported to be relocated to nucleus in <italic>Trifolium</italic> species (Cai et al., <xref ref-type="bibr" rid="B5">2008</xref>) is present in both <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic>, and all the other sequenced legumes (Guo et al., <xref ref-type="bibr" rid="B21">2007</xref>; Jansen et al., <xref ref-type="bibr" rid="B32">2008</xref>). It has been reported that <italic>accD</italic> shows considerable length variation among the legumes that retains it. The increased rate of sequence evolution and localized hypermutation has led to the phenomenon of gene loss or relocation to nucleus in legumes (Magee et al., <xref ref-type="bibr" rid="B43">2010</xref>). Among the angiosperms, legumes are more prone to rearrangements and gene losses (Palmer et al., <xref ref-type="bibr" rid="B59">1988</xref>). Mostly the genes coding for ribosomal proteins have been lost during the evolution from the plastid genome. There are no reports for the loss of genes related to electron transport chain, atp synthesis or those associated with photosystem I and II (Jansen et al., <xref ref-type="bibr" rid="B30">2007</xref>).</p>
</sec>
<sec><title>Gene order</title>
<p>The cp genomes of <italic>C. cajan</italic> and <italic>C. scarabaeoides</italic> were aligned with the cp genomes of previously reported legumes by including <italic>Arabidopsis</italic> cp genome as reference with help of Mauve software (Darling et al., <xref ref-type="bibr" rid="B11">2004</xref>; Figure <xref ref-type="fig" rid="F3">3</xref>). All the legume cp genomes generally shared the same gene order but the major difference among them was absence of IRb region in <italic>Cicer</italic> and <italic>Medicago</italic>. The cp genome of <italic>Cicer</italic> has lost one copy of the IR, a feature also shared by <italic>Medicago</italic>. Lavin et al. (<xref ref-type="bibr" rid="B37">1990</xref>) reported the loss of one copy of inverted repeat in six legume tribes including Galegeae, Hedysareae, Carmichaelieae, Vicieae, Cicereae, and Trifolieae. All these legume tribes form a new clade called IRLC (inverted-repeat-lacking clade; Palmer et al., <xref ref-type="bibr" rid="B58">1987</xref>; Cronk et al., <xref ref-type="bibr" rid="B8">2006</xref>). The cp genomes possessing the inverted repeat have a very conserved and stable genomic structure while the genomes which have lost one copy of inverted repeat have undergone extensive genomic rearrangements (e.g., <italic>Vicia, Trifolium, Pisum</italic>; Palmer and Thompson, <xref ref-type="bibr" rid="B61">1982</xref>; Doyle et al., <xref ref-type="bibr" rid="B17">1995</xref>).</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p><bold>Gene order comparison of legume cp genomes, with Arabidopsis cp genome as reference, using MAUVE software</bold>. The boxes above the line represent the gene sequence in clockwise direction and the boxes below the line represent gene sequences in opposite orientation. The gene names at the bottom indicate the genes located at the boundaries of the boxes in cp genome of pigeonpea. AKPA1- <italic>C. scarabaeoides</italic>, AKPR375<italic>- C. cajan.</italic></p></caption>
<graphic xlink:href="fpls-07-01847-g0003.tif"/>
</fig>
<p>All the legume genomes have a common 50-kb inversion as compared to <italic>Arabidopsis</italic> cp genome. This inversion spans the region between <italic>rbc</italic>l and <italic>rps16</italic> in the LSC region. This inversion was described for the first time in <italic>P. sativum, V. faba</italic>, and <italic>V. radiata</italic> (Palmer and Thompson, <xref ref-type="bibr" rid="B61">1982</xref>) and is confined to Papilionoideae subfamily of leguminosae (Doyle et al., <xref ref-type="bibr" rid="B14">1996</xref>).</p>
<p>Another inversion of 78-kb is present in cp genome of <italic>V. radiata</italic> and <italic>P. vulgaris</italic> but absent from other legume cp genomes, was originally reported in subtribe phaseolinae (<italic>Vigna</italic> and <italic>Phaseolus</italic>). The inversion spans the region between <italic>trnH-GUG/rpl14</italic> and <italic>rps19/rps8</italic>. This 78-kb inversion may have resulted due to expansion and subsequent contraction of the inverted repeats (Bruneau et al., <xref ref-type="bibr" rid="B2">1990</xref>).</p>
<p>The cp genome of both pigeonpea genotypes displays one more inversion between the LSC and IRs which is common with <italic>G. max</italic>. This may be the result of flip-flop intramolecular recombination occurring in the plastome (Palmer, <xref ref-type="bibr" rid="B56">1983</xref>). The rearrangements such as inversions in the chloroplast genome of land plants are rare and they have proven to be useful markers for phylogenetic analysis (Jansen and Palmer, <xref ref-type="bibr" rid="B31">1987</xref>; Doyle et al., <xref ref-type="bibr" rid="B15">1992</xref>; Raubeson and Jansen, <xref ref-type="bibr" rid="B69">1992</xref>) in a number of groups such as legumes (Bruneau et al., <xref ref-type="bibr" rid="B2">1990</xref>). Therefore, these rearrangements are indicative of the diversity observed in the cpDNA organization of legume plants.</p>
</sec>
<sec><title>Comparison with other legume genomes</title>
<p>The sequence identity of <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> cp genome was plotted using mVISTA (Figure <xref ref-type="fig" rid="F4">4</xref>). The coding regions were found to be more conserved than the non-coding regions, as also reported for other cp genomes. The IR regions were found to be more conserved than the single copy regions probably due to the phenomenon of copy correction between IR sequences by gene conversion (Khakhlova and Bock, <xref ref-type="bibr" rid="B34">2006</xref>). Another explanation for the conservation of IR is the presence of conserved rRNA genes in the IR region. The coding regions showing high degree of variation are <italic>accD, cemA, petA, psbT</italic>, and <italic>clpP</italic> as also reported for other cp genomes (Yang et al., <xref ref-type="bibr" rid="B97">2014</xref>; Yao et al., <xref ref-type="bibr" rid="B98">2015</xref>). The intergenic region between <italic>trnC-GCA&#x02013;psbD, petD-rps3, psbK-accD, petA-psbT trnK-UUU- rbcL</italic>, and <italic>ndhJ&#x02013;ycf3</italic> show high sequence divergence among the legumes aligned.</p>
<fig id="F4" position="float">
<label>Figure 4</label>
<caption><p><bold>Sequence alignment of legume cp genomes, with <italic>C. cajan</italic> cp genome set as a reference using mVista</bold>. Position and transcriptional direction of each gene is indicated by gray arrows. Intergenic and genic regions are indicated by red and blue areas respectively. Sequence identity between the cp genomes is shown on y-axis as a percentage between 50 and 100%. AKPA1- <italic>C. scarabaeoides</italic>, AKPR375<italic>- C. cajan.</italic></p></caption>
<graphic xlink:href="fpls-07-01847-g0004.tif"/>
</fig>
</sec>
<sec><title>IR boundaries</title>
<p>The IR regions are resistant to recombinational loss and therefore help in the stabilization of the cp genome (Perry and Wolfe, <xref ref-type="bibr" rid="B63">2002</xref>). Both <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> possesses the smallest IR among the legumes and includes 21 completely duplicated genes. At IR/LSC junction <italic>rps19</italic> gene is excluded from the IR, rather <italic>rpl2</italic> gene is included and hence the whole <italic>rpl2</italic> gene is duplicated and included in the IR. Subsequently the IR merges into <italic>ycf1</italic> gene at IR/SSC junction with 448 bp and 444 bp of <italic>ycf1</italic> gene included in the IR region of <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> respectively. On comparing the cp genomes of <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> with other legumes it was observed that <italic>rps19</italic> gene (68 bp) was included in the IR region of <italic>G. max</italic> and showed partial duplication while in <italic>V. radiata</italic> and <italic>P. vulgaris</italic> the complete <italic>rps19</italic> gene was included and hence duplicated in the IR region. This feature however varies between the legumes as <italic>rps19</italic> gene is absent from the IR of <italic>Millettia</italic> and <italic>Lupinus</italic> (Williams et al., <xref ref-type="bibr" rid="B90">2015</xref>), which is similar to that observed in pigeonpea. On the other hand, at IR/SSC junction, the <italic>ycf1</italic> gene is included in the IR in all the legumes but to different extents (Figure <xref ref-type="fig" rid="F5">5</xref>). Absence of <italic>rps19</italic> gene from the IR of pigeonpea plastid genome makes it smallest among all legumes leading to a bigger SSC region. This phenomenon of IR expansion and contraction could have resulted into the size variation among the legume cp genomes.</p>
<fig id="F5" position="float">
<label>Figure 5</label>
<caption><p><bold>Comparison of the border positions of LSC, SSC, and IR regions among the legume genomes</bold>. Genes are denoted by boxes and the gaps between the genes and the boundaries are indicated by number of bases unless the gene coincides with the boundary. Extensions of the genes are also indicated above the boxes. AKPA1- <italic>C. scarabaeoides</italic>, AKPR375<italic>- C. cajan.</italic></p></caption>
<graphic xlink:href="fpls-07-01847-g0005.tif"/>
</fig>
</sec>
<sec><title>RNA editing sites in transcripts from <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic></title>
<p>Editing sites in the cp DNA of pigeonpea genotypes were identified by PREP-cp program. It predicted 63 editing sites in 23 genes in <italic>C. scarabaeoides</italic> and 62 editing sites in 22 genes in <italic>C. cajan</italic>. Validation of the editing sites was done by mapping the transcriptome reads onto the DNA sequences from chloroplast and the sites having minimum 5X coverage were considered. Confirmation of editing at 37 sites in <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> was observed. In addition, 8 editing sites in <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> were identified, which were not predicted by PREPcp. Among all the genes analyzed, <italic>ndh</italic> gene displays the maximum number of editing sites (Supplementary Tables <xref ref-type="supplementary-material" rid="SM6">S6</xref>, <xref ref-type="supplementary-material" rid="SM7">S7</xref>), <italic>ndh</italic> genes have been reported to contain maximum number of editing sites (Corneille et al., <xref ref-type="bibr" rid="B7">2000</xref>; Huang et al., <xref ref-type="bibr" rid="B27">2013</xref>), since they are considered to be dispensable (Burrows et al., <xref ref-type="bibr" rid="B4">1998</xref>; Shikanai et al., <xref ref-type="bibr" rid="B78">1998</xref>), therefore accumulation of editing sites may have been permitted in <italic>ndh</italic> transcript due to dearth of stringent requirement of <italic>ndh</italic> function.</p>
<p>The editing type observed was 100% C&#x02013;U, out of which 13.5% were silent, and 86.4% non-silent in both <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic>. Silent editing occurs due to change in the third codon position which therefore does not lead to any amino acid change (Maier et al., <xref ref-type="bibr" rid="B45">1996</xref>). Though silent RNA editing is frequent in mitochondrial genome which could account for 30% but it was reported for the first time in tobacco chloroplast genome at only one site in <italic>atpA</italic> gene (Hirose et al., <xref ref-type="bibr" rid="B23">1996</xref>).</p>
<p>The editing event was most frequent at 2nd codon position in pigeonpea cp genome with 78.3% of editing occurring at 2nd position in both <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic>. Among the amino acid changes 23 were converted from hydrophilic to hydrophobic and 1 amino acid from hydrophobic to hydrophilic in <italic>C. scarabaeoides</italic>. Similarly, 23 amino acids were converted from hydrophilic to hydrophobic and 1 amino acid from hydrophobic to hydrophilic in <italic>C. cajan</italic>. In both the genomes maximum conversion was observed for serine to leucine (45.9%). As evident from the results editing changes lead to increased number of hydrophobic amino acids as compared to hydrophilic amino acids in both the genotypes. These results are consistent with findings in other cp genomes also (Lee et al., <xref ref-type="bibr" rid="B38">2014</xref>; Raman and Park, <xref ref-type="bibr" rid="B67">2015</xref>). This bias might reflect the codon usage of plant plastome or may be the result of constraints due to the editing mechanism. For example, amino acid leucine may be preferred as it is a hydrophobic amino acid therefore prefers to be buried in the protein hydrophobic cores and hence involved in binding/recognition of hydrophobic ligands such as lipids.</p>
<p>Generally, the editing occurs in protein coding regions of chloroplast to restore the evolutionary conserved amino acids sequence (Maier et al., <xref ref-type="bibr" rid="B45">1996</xref>). Like in pigeonpea cp genome, the frequency of editing sites is similar to that observed in other legumes like Pea (Inada et al., <xref ref-type="bibr" rid="B29">2004</xref>) and <italic>V. radiata</italic> (Lin et al., <xref ref-type="bibr" rid="B40">2015</xref>). Generally the editing sites vary between 20 and 37 in angiosperms (Hirose et al., <xref ref-type="bibr" rid="B24">1999</xref>; Corneille et al., <xref ref-type="bibr" rid="B7">2000</xref>; Lutz and Maliga, <xref ref-type="bibr" rid="B42">2001</xref>). On the basis of comparison of editing frequencies and patterns it has been predicted that RNA editing is specific to a particular species. Although, editing has been found in all major lineages of land plants but its pattern does not correspond to the position of a particular species in the phylogenetic tree (Freyer et al., <xref ref-type="bibr" rid="B19">1997</xref>).</p>
</sec>
<sec><title>Microsatellite mining</title>
<p>Chloroplast microsatellites (cpSSRs) are highly polymorphic due to the conserved gene order, non-recombinant and uniparentally inherited nature of the chloroplast genome (cpDNA) making them useful tools for studying phylogenetic relationships in plants (Olmstead and Palmer, <xref ref-type="bibr" rid="B54">1994</xref>). We analyzed chloroplast SSRs (cpSSRs) with the MISA perl script and a total of 280 and 292 cpSSRs were identified in <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> respectively. The number was higher than that of cpSSRs identified in <italic>V. radiata, Sesamum indicum</italic> and <italic>Camellia</italic> species (Yi and Kim, <xref ref-type="bibr" rid="B99">2012</xref>; Huang et al., <xref ref-type="bibr" rid="B26">2014</xref>; Lin et al., <xref ref-type="bibr" rid="B40">2015</xref>). Of the 280 repeats identified in <italic>C. scarabaeoides</italic>: 71.07% (199 SSRs) were located in the LSC region, 17.85% (50 SSRs) in the SSC region and 31% (11.07 SSRs) in the IR regions. In contrast, out of the 292 repeat motifs identified in <italic>C. cajan</italic>, 72.26% (211 SSRs) were present in LSC region, 17.46% (51 SSRs) in the SSC region and the remaining 10.27% (30 SSRs) were located in the IR regions, as reported in other plants like olives and artichoke (Mariotti et al., <xref ref-type="bibr" rid="B46">2010</xref>; Curci et al., <xref ref-type="bibr" rid="B10">2015</xref>). Furthermore, the SSR repeats were distributed among three different regions: coding sequence, intronic sequence, and intergenic spacer regions (Figure <xref ref-type="fig" rid="F6">6</xref>). 171 (61%) and 193 (66%) SSRs were located in the intergenic spacer regions of <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> respectively. Followed by 71 (25%) and 65 (22%) SSRs in the coding sequence and the remaining 38 (14%) and 34 (12%) repeats were present in the intronic regions. These results were in accordance with those reported in <italic>G. max</italic> (Ozyigit et al., <xref ref-type="bibr" rid="B55">2015</xref>) indicating high degree of homology and conserved nature of genomes.</p>
<fig id="F6" position="float">
<label>Figure 6</label>
<caption><p><bold>Repeat distribution among three different regions: coding sequences, intronic sequences, and intergenic spacer regions (A)</bold> AKPA1 (<italic>C. scarabaeoides</italic>); <bold>(B)</bold> AKPR375 (<italic>C. cajan)</italic>.</p></caption>
<graphic xlink:href="fpls-07-01847-g0006.tif"/>
</fig>
<p>Of the SSRs identified, 49.28% (138 SSRs) and 45.89% (134 SSRs) were perfect repeats in <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> respectively. While 5.7%, 0.35% and 14.6% SSRs constituted imperfect, compound and compound imperfect repeats in <italic>C. scarabaeoides</italic> and 6.16%, 0.3%, 15.41% SSRs in <italic>C. cajan</italic> respectively.</p>
<p>Among the repeat types, the most abundant repeat was found to be mononucleotides in both <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> (Figure <xref ref-type="fig" rid="F7">7</xref>), with no hexa- repeats identified in both the genotypes and were distributed among the coding and non-coding regions (Figures <xref ref-type="fig" rid="F8">8A,B</xref>). The findings were in agreement with those in <italic>Sesame</italic> (Yi and Kim, <xref ref-type="bibr" rid="B99">2012</xref>) and olive species (Mariotti et al., <xref ref-type="bibr" rid="B46">2010</xref>). Majority of the microsatellites in the chloroplast genome are mononucleotide A/T repeats (Wheeler et al., <xref ref-type="bibr" rid="B89">2014</xref>). Likewise, mononucleotides A/T were predominant in both pigeonpea genotypes which is in agreement with results from previous studies in <italic>Oryza sativa, V. radiata, Camellia</italic> species and <italic>Sesame indicum</italic> (Rajendrakumar et al., <xref ref-type="bibr" rid="B66">2007</xref>; Tangphatsornruang et al., <xref ref-type="bibr" rid="B82">2010</xref>; Yi and Kim, <xref ref-type="bibr" rid="B99">2012</xref>; Huang et al., <xref ref-type="bibr" rid="B26">2014</xref>). AT/TA (93.10%) was most frequent dinucleotide motifs followed by AG/TC in both <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> respectively. Higher frequency of AT/TA motifs was also reported in <italic>Glycine</italic> species, olive species and <italic>Sesamum indicum</italic> (Mariotti et al., <xref ref-type="bibr" rid="B46">2010</xref>; Yi and Kim, <xref ref-type="bibr" rid="B99">2012</xref>; Ozyigit et al., <xref ref-type="bibr" rid="B55">2015</xref>). AAT/TTA and AAAT/TTTA were the most frequent trinucleotide and tetranucleotide motifs followed by ATT/TAA and AATA/ TTAT in both <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic>. Only one pentanucleotide motif TATTA/ATAAT was identified in the <italic>C. cajan</italic>, while no hexameric repeats were observed. This is evident from the AT bias the plastid genomes seems to possess.</p>
<fig id="F7" position="float">
<label>Figure 7</label>
<caption><p><bold>SSR distribution on the basis of repeat type</bold>.</p></caption>
<graphic xlink:href="fpls-07-01847-g0007.tif"/>
</fig>
<fig id="F8" position="float">
<label>Figure 8</label>
<caption><p><bold>SSR type distribution between coding and non-coding regions (A)</bold> AKPA1 (<italic>C. scarabaeoides</italic>); <bold>(B)</bold> AKPR375 (<italic>C. cajan)</italic>.</p></caption>
<graphic xlink:href="fpls-07-01847-g0008.tif"/>
</fig>
<p>The chloroplast gene possessing the highest number of repeats was <italic>ycf1</italic> in both the genotypes (Supplementary Tables <xref ref-type="supplementary-material" rid="SM8">S8</xref>, <xref ref-type="supplementary-material" rid="SM9">S9</xref>). Our findings are in agreement with those from <italic>Glycine</italic> species, <italic>V. radiata, Camellia</italic> species, <italic>Cynara cardunculus</italic> (Tangphatsornruang et al., <xref ref-type="bibr" rid="B82">2010</xref>; Huang et al., <xref ref-type="bibr" rid="B26">2014</xref>; Curci et al., <xref ref-type="bibr" rid="B10">2015</xref>; Ozyigit et al., <xref ref-type="bibr" rid="B55">2015</xref>). Dong et al. (<xref ref-type="bibr" rid="B13">2012</xref>) expressed <italic>ycf1</italic> gene as the most variable locus accordingly highly variable SSRs can be located in the <italic>ycf1</italic> coding region of the pigeonpea cp genome.</p>
</sec>
</sec>
<sec sec-type="conclusions" id="s4"><title>Conclusion</title>
<p>The draft cp genome of <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> were sequenced by Roche-454 technology. This is the first study reporting the sequence of pigeonpea cp genome. The pigeonpea cp genome is similar to other legume cp genomes, in terms of cp genome size and number of unique genes. The organization of pigeonpea cp genome shows similarity to other legume cp genomes except for IR contraction and hence exclusion of <italic>rps19</italic> gene from the IR. The genes <italic>rps16, rpl33, ycf15, ycf68</italic>, and <italic>ycf1</italic> were observed as pseudogenes and <italic>rpl22</italic> and <italic>infA</italic> are absent from the pigeonpea cp genome. RNA editing was also observed at 37 sites in both plastids, particularly in <italic>ndh</italic> gene region. Chloroplast SSRs were also mined, with 280 and 292 cpSSRs being identified in <italic>C. scarabaeoides</italic> and <italic>C. cajan</italic> respectively. This study would be helpful in phylogenetic and evolutionary studies of pigeonpea with other legumes.</p>
</sec>
<sec id="s5"><title>Author contributions</title>
<p>TK carried out the experiments, prepared the genomic library for Roche sequencing and sequencing run and wrote the manuscript. PC performed chloroplast genome assembly and bioinformatics analysis. SS carried out the SSR markers discovery and validation. TK, PC, SS, and KB were involved in the result interpretation, analysis, and finalization of the manuscript. NS, TS, and AC contributed in data analysis, genome annotation, and manuscript finalization. SG provided the germplasm and assisted in data analysis. KG conceived the study, designed the experiments, and coordinated the work. All the authors have read and approved the final manuscript.</p>
<sec><title>Conflict of interest statement</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</sec>
</body>
<back>
<ack><p>We acknowledge the financial support received from ICAR-National Research Centre on Plant Biotechnology and technical support from Roche India.</p>
</ack>
<sec sec-type="supplementary-material" id="s6"><title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="http://journal.frontiersin.org/article/10.3389/fpls.2016.01847/full#supplementary-material">http://journal.frontiersin.org/article/10.3389/fpls.2016.01847/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table1.DOCX" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table2.DOCX" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table3.DOCX" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table4.docx" id="SM4" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table5.DOCX" id="SM5" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table6.DOCX" id="SM6" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table7.DOCX" id="SM7" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table8.DOCX" id="SM8" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table9.DOCX" id="SM9" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Bock</surname> <given-names>R.</given-names></name></person-group> (<year>2007</year>). <article-title>Structure, function, and inheritance of plastid genomes</article-title>, in <source>Cell and Molecular Biology of Plastids</source>, ed <person-group person-group-type="editor"><name><surname>Bock</surname> <given-names>R.</given-names></name></person-group>(<publisher-loc>Berlin; Heidelberg</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>29</fpage>&#x02013;<lpage>63</lpage>.</citation>
</ref>
<ref id="B2">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bruneau</surname> <given-names>A.</given-names></name> <name><surname>Doyle</surname> <given-names>J. J.</given-names></name> <name><surname>Palmer</surname> <given-names>J. D.</given-names></name></person-group> (<year>1990</year>). <article-title>A Chloroplast DNA Inversion as a subtribal character in the Phaseoleae (Leguminosae)</article-title>. <source>Syst. Bot.</source> <volume>15</volume>, <fpage>378</fpage>&#x02013;<lpage>386</lpage>. <pub-id pub-id-type="doi">10.2307/2419351</pub-id></citation>
</ref>
<ref id="B3">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bulmer</surname> <given-names>M.</given-names></name></person-group> (<year>1988</year>). <article-title>Are codon usage patterns in unicellular organisms determined by selection-mutation balance?</article-title> <source>J. Evol. Biol.</source> <volume>1</volume>, <fpage>15</fpage>&#x02013;<lpage>26</lpage>. <pub-id pub-id-type="doi">10.1046/j.1420-9101.1988.1010015.x</pub-id></citation>
</ref>
<ref id="B4">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Burrows</surname> <given-names>P. A.</given-names></name> <name><surname>Sazanov</surname> <given-names>L. A.</given-names></name> <name><surname>Svab</surname> <given-names>Z.</given-names></name> <name><surname>Maliga</surname> <given-names>P.</given-names></name> <name><surname>Nixon</surname> <given-names>P. J.</given-names></name></person-group> (<year>1998</year>). <article-title>Identification of a functional respiratory complex in chloroplasts through analysis of tobacco mutants containing disrupted plastid ndh genes</article-title>. <source>EMBO J.</source> <volume>17</volume>, <fpage>868</fpage>&#x02013;<lpage>876</lpage>. <pub-id pub-id-type="doi">10.1093/emboj/17.4.868</pub-id><pub-id pub-id-type="pmid">9463365</pub-id></citation>
</ref>
<ref id="B5">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cai</surname> <given-names>Z.</given-names></name> <name><surname>Guisinger</surname> <given-names>M.</given-names></name> <name><surname>Kim</surname> <given-names>H. G.</given-names></name> <name><surname>Ruck</surname> <given-names>E.</given-names></name> <name><surname>Blazier</surname> <given-names>J. C.</given-names></name> <name><surname>McMurtry</surname> <given-names>V.</given-names></name> <etal/></person-group>. (<year>2008</year>). <article-title>Extensive reorganization of the plastid genome of <italic>Trifolium subterraneum</italic> (Fabaceae) is associated with numerous repeated sequences and novel DNA insertions</article-title>. <source>J. Mol. Evol.</source> <volume>67</volume>, <fpage>696</fpage>&#x02013;<lpage>704</lpage>. <pub-id pub-id-type="doi">10.1007/s00239-008-9180-7</pub-id><pub-id pub-id-type="pmid">19018585</pub-id></citation>
</ref>
<ref id="B6">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>J.</given-names></name> <name><surname>Hao</surname> <given-names>Z.</given-names></name> <name><surname>Xu</surname> <given-names>H.</given-names></name> <name><surname>Yang</surname> <given-names>L.</given-names></name> <name><surname>Liu</surname> <given-names>G.</given-names></name> <name><surname>Sheng</surname> <given-names>Y.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>The complete chloroplast genome sequence of the relict woody plant Metasequoia glyptostroboides Hu et Cheng</article-title>. <source>Front. Plant Sci.</source> <volume>6</volume>:<fpage>447</fpage>. <pub-id pub-id-type="doi">10.3389/fpls.2015.00447</pub-id><pub-id pub-id-type="pmid">26136762</pub-id></citation>
</ref>
<ref id="B7">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Corneille</surname> <given-names>S.</given-names></name> <name><surname>Lutz</surname> <given-names>K.</given-names></name> <name><surname>Maliga</surname> <given-names>P.</given-names></name></person-group> (<year>2000</year>). <article-title>Conservation of RNA editing between rice and maize plastids: are most editing events dispensable?</article-title> <source>Mol. Gen. Genet.</source> <volume>264</volume>, <fpage>419</fpage>&#x02013;<lpage>424</lpage>. <pub-id pub-id-type="doi">10.1007/s004380000295</pub-id><pub-id pub-id-type="pmid">11129045</pub-id></citation>
</ref>
<ref id="B8">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cronk</surname> <given-names>Q.</given-names></name> <name><surname>Ojeda</surname> <given-names>I.</given-names></name> <name><surname>Pennington</surname> <given-names>R. T.</given-names></name></person-group> (<year>2006</year>). <article-title>Legume comparative genomics: progress in phylogenetics and phylogenomics</article-title>. <source>Curr. Opin. Plant Biol.</source> <volume>9</volume>, <fpage>99</fpage>&#x02013;<lpage>103</lpage>. <pub-id pub-id-type="doi">10.1016/j.pbi.2006.01.011</pub-id><pub-id pub-id-type="pmid">16480916</pub-id></citation>
</ref>
<ref id="B9">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cronn</surname> <given-names>R.</given-names></name> <name><surname>Liston</surname> <given-names>A.</given-names></name> <name><surname>Parks</surname> <given-names>M.</given-names></name> <name><surname>Gernandt</surname> <given-names>D. S.</given-names></name> <name><surname>Shen</surname> <given-names>R.</given-names></name> <name><surname>Mockler</surname> <given-names>T.</given-names></name></person-group> (<year>2008</year>). <article-title>Multiplex sequencing of plant chloroplast genomes using Solexa sequencing-by-synthesis technology</article-title>. <source>Nucleic Acids Res.</source> <volume>36</volume>:<fpage>e122</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gkn502</pub-id><pub-id pub-id-type="pmid">18753151</pub-id></citation>
</ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Curci</surname> <given-names>P. L.</given-names></name> <name><surname>De Paola</surname> <given-names>D.</given-names></name> <name><surname>Danzi</surname> <given-names>D.</given-names></name> <name><surname>Vendramin</surname> <given-names>G. G.</given-names></name> <name><surname>Sonnante</surname> <given-names>G.</given-names></name></person-group> (<year>2015</year>). <article-title>Complete chloroplast genome of the multifunctional crop globe artichoke and comparison with other Asteraceae</article-title>. <source>PLoS ONE</source> <volume>10</volume>:<fpage>e120589</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0120589</pub-id><pub-id pub-id-type="pmid">25774672</pub-id></citation>
</ref>
<ref id="B11">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Darling</surname> <given-names>A. C. E.</given-names></name> <name><surname>Mau</surname> <given-names>B.</given-names></name> <name><surname>Blattner</surname> <given-names>F. R.</given-names></name> <name><surname>Perna</surname> <given-names>N. T.</given-names></name></person-group> (<year>2004</year>). <article-title>Mauve: multiple alignment of conserved genomic sequence with rearrangements</article-title>. <source>Genome Res.</source> <volume>14</volume>, <fpage>1394</fpage>&#x02013;<lpage>1403</lpage>. <pub-id pub-id-type="doi">10.1101/gr.2289704</pub-id><pub-id pub-id-type="pmid">15231754</pub-id></citation>
</ref>
<ref id="B12">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dhingra</surname> <given-names>A.</given-names></name> <name><surname>Folta</surname> <given-names>K. M.</given-names></name></person-group> (<year>2005</year>). <article-title>ASAP: amplification, sequencing &#x00026; annotation of plastomes</article-title>. <source>BMC Genomics</source> <volume>6</volume>:<fpage>176</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2164-6-176</pub-id><pub-id pub-id-type="pmid">16336644</pub-id></citation>
</ref>
<ref id="B13">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dong</surname> <given-names>W.</given-names></name> <name><surname>Liu</surname> <given-names>J.</given-names></name> <name><surname>Yu</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Zhou</surname> <given-names>S.</given-names></name></person-group> (<year>2012</year>). <article-title>Highly variable chloroplast markers for evaluating plant phylogeny at low taxonomic levels and for DNA Barcoding</article-title>. <source>PLoS ONE</source> <volume>7</volume>:<fpage>e35071</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0035071</pub-id><pub-id pub-id-type="pmid">22511980</pub-id></citation>
</ref>
<ref id="B14">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Doyle</surname> <given-names>J.</given-names></name> <name><surname>Ballenger</surname> <given-names>J. A.</given-names></name> <name><surname>Palmer</surname> <given-names>J.</given-names></name></person-group> (<year>1996</year>). <article-title>The distribution and phylogenetic significance of a 50-kb chloroplast DNA inversion in the flowering plant family Leguminosae</article-title>. <source>Mol. Phylogenet. Evol.</source> <volume>5</volume>, <fpage>429</fpage>&#x02013;<lpage>438</lpage>. <pub-id pub-id-type="doi">10.1006/mpev.1996.0038</pub-id><pub-id pub-id-type="pmid">8728401</pub-id></citation>
</ref>
<ref id="B15">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Doyle</surname> <given-names>J. J.</given-names></name> <name><surname>Davis</surname> <given-names>J. I.</given-names></name> <name><surname>Soreng</surname> <given-names>R. J.</given-names></name> <name><surname>Garvin</surname> <given-names>D.</given-names></name> <name><surname>Anderson</surname> <given-names>M. J.</given-names></name></person-group> (<year>1992</year>). <article-title>Chloroplast DNA inversions and the origin of the grass family (Poaceae)</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>89</volume>, <fpage>7722</fpage>&#x02013;<lpage>7726</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.89.16.7722</pub-id><pub-id pub-id-type="pmid">1502190</pub-id></citation>
</ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Doyle</surname> <given-names>J. J.</given-names></name> <name><surname>Doyle</surname> <given-names>J. L.</given-names></name> <name><surname>Ballenger</surname> <given-names>J. A.</given-names></name> <name><surname>Dickson</surname> <given-names>E. E.</given-names></name> <name><surname>Kajita</surname> <given-names>T.</given-names></name> <name><surname>Ohashi</surname> <given-names>H.</given-names></name></person-group> (<year>1997</year>). <article-title>A phylogeny of the chloroplast gene rbcL in the leguminosae: Taxonomic correlations and insights into the evolution of nodulation</article-title>. <source>Am. J. Bot.</source> <volume>84</volume>, <fpage>541</fpage>&#x02013;<lpage>554</lpage>. <pub-id pub-id-type="doi">10.2307/2446030</pub-id><pub-id pub-id-type="pmid">21708606</pub-id></citation>
</ref>
<ref id="B17">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Doyle</surname> <given-names>J. J.</given-names></name> <name><surname>Doyle</surname> <given-names>J. L.</given-names></name> <name><surname>Palmer</surname> <given-names>J. D.</given-names></name></person-group> (<year>1995</year>). <article-title>Multiple Independent Losses of Two Genes and One Intron from Legume Chloroplast Genomes</article-title>. <source>Syst. Bot.</source> <volume>20</volume>, <fpage>272</fpage>&#x02013;<lpage>294</lpage>. <pub-id pub-id-type="doi">10.2307/2419496</pub-id></citation>
</ref>
<ref id="B18">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Frazer</surname> <given-names>K. A.</given-names></name> <name><surname>Pachter</surname> <given-names>L.</given-names></name> <name><surname>Poliakov</surname> <given-names>A.</given-names></name> <name><surname>Rubin</surname> <given-names>E. M.</given-names></name> <name><surname>Dubchak</surname> <given-names>I.</given-names></name></person-group> (<year>2004</year>). <article-title>VISTA: computational tools for comparative genomics</article-title>. <source>Nucleic Acids Res.</source> <volume>32</volume>, <fpage>273</fpage>&#x02013;<lpage>279</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkh458</pub-id><pub-id pub-id-type="pmid">15215394</pub-id></citation>
</ref>
<ref id="B19">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Freyer</surname> <given-names>R.</given-names></name> <name><surname>Kiefer-Meyer</surname> <given-names>M. C.</given-names></name> <name><surname>Kossel</surname> <given-names>H.</given-names></name></person-group> (<year>1997</year>). <article-title>Occurrence of plastid RNA editing in all major lineages of land plants</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>94</volume>, <fpage>6285</fpage>&#x02013;<lpage>6290</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.94.12.6285</pub-id><pub-id pub-id-type="pmid">9177209</pub-id></citation>
</ref>
<ref id="B20">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gantt</surname> <given-names>J. S.</given-names></name> <name><surname>Baldauf</surname> <given-names>S. L.</given-names></name> <name><surname>Calie</surname> <given-names>P. J.</given-names></name> <name><surname>Weeden</surname> <given-names>N. F.</given-names></name> <name><surname>Palmer</surname> <given-names>J. D.</given-names></name></person-group> (<year>1991</year>). <article-title>Transfer of rpl22 to the nucleus greatly preceded its loss from the chloroplast and involved the gain of an intron</article-title>. <source>EMBO J.</source> <volume>10</volume>, <fpage>3073</fpage>&#x02013;<lpage>3078</lpage>. <pub-id pub-id-type="pmid">1915281</pub-id></citation>
</ref>
<ref id="B21">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guo</surname> <given-names>X.</given-names></name> <name><surname>Castillo-Ram&#x000ED;rez</surname> <given-names>S.</given-names></name> <name><surname>Gonz&#x000E1;lez</surname> <given-names>V.</given-names></name> <name><surname>Bustos</surname> <given-names>P.</given-names></name> <name><surname>Fern&#x000E1;ndez-V&#x000E1;zquez</surname> <given-names>J. L.</given-names></name> <name><surname>Santamar&#x000ED;a</surname> <given-names>R. I.</given-names></name> <etal/></person-group>. (<year>2007</year>). <article-title>Rapid evolutionary change of common bean (<italic>Phaseolus vulgaris</italic> L) plastome, and the genomic diversification of legume chloroplasts</article-title>. <source>BMC Genomics</source> <volume>8</volume>:<fpage>228</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2164-8-228</pub-id><pub-id pub-id-type="pmid">17623083</pub-id></citation>
</ref>
<ref id="B22">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hiratsuka</surname> <given-names>J.</given-names></name> <name><surname>Shimada</surname> <given-names>H.</given-names></name> <name><surname>Whittier</surname> <given-names>R.</given-names></name> <name><surname>Ishibashi</surname> <given-names>T.</given-names></name> <name><surname>Sakamoto</surname> <given-names>M.</given-names></name> <name><surname>Mori</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>1989</year>). <article-title>The complete sequence of the rice (<italic>Oryza sativa</italic>) chloroplast genome: intermolecular recombination between distinct tRNA genes accounts for a major plastid DNA inversion during the evolution of the cereals</article-title>. <source>MGG Mol. Gen. Genet.</source> <volume>217</volume>, <fpage>185</fpage>&#x02013;<lpage>194</lpage>. <pub-id pub-id-type="doi">10.1007/BF02464880</pub-id><pub-id pub-id-type="pmid">2770692</pub-id></citation>
</ref>
<ref id="B23">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hirose</surname> <given-names>T.</given-names></name> <name><surname>Fan</surname> <given-names>H.</given-names></name> <name><surname>Suzuki</surname> <given-names>J. Y.</given-names></name> <name><surname>Wakasugi</surname> <given-names>T.</given-names></name> <name><surname>Tsudzuki</surname> <given-names>T.</given-names></name> <name><surname>K&#x000F6;ssel</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>1996</year>). <article-title>Occurrence of silent RNA editing in chloroplasts: its species specificity and the influence of environmental and developmental conditions</article-title>. <source>Plant Mol. Biol.</source> <volume>30</volume>, <fpage>667</fpage>&#x02013;<lpage>672</lpage>. <pub-id pub-id-type="pmid">8605316</pub-id></citation>
</ref>
<ref id="B24">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hirose</surname> <given-names>T.</given-names></name> <name><surname>Kusumegi</surname> <given-names>T.</given-names></name> <name><surname>Tsudzuki</surname> <given-names>T.</given-names></name> <name><surname>Sugiura</surname> <given-names>M.</given-names></name></person-group> (<year>1999</year>). <article-title>RNA editing sites in tobacco chloroplast transcripts: editing as a possible regulator of chloroplast RNA polymerase activity</article-title>. <source>Mol. Gen. Genet.</source> <volume>262</volume>, <fpage>462</fpage>&#x02013;<lpage>467</lpage>. <pub-id pub-id-type="doi">10.1007/s004380051106</pub-id><pub-id pub-id-type="pmid">10589833</pub-id></citation>
</ref>
<ref id="B25">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname> <given-names>A. J.</given-names></name> <name><surname>Lavin</surname> <given-names>M.</given-names></name> <name><surname>Wojciechowski</surname> <given-names>M. F.</given-names></name> <name><surname>Sanderson</surname> <given-names>M. J.</given-names></name></person-group> (<year>2002</year>). <article-title>Phylogenetic analysis of nuclear ribosomal ITS / 5. 8S sequences in the Tribe Millettieae (Fabaceae): Poecilanthe - Cyclolobium, the core Millettieae, and the Callerya Group</article-title>. <source>Syst. Bot.</source> <volume>27</volume>, <fpage>722</fpage>&#x02013;<lpage>733</lpage>.</citation>
</ref>
<ref id="B26">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>H.</given-names></name> <name><surname>Shi</surname> <given-names>C.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name> <name><surname>Mao</surname> <given-names>S.</given-names></name> <name><surname>Gao</surname> <given-names>L.</given-names></name></person-group> (<year>2014</year>). <article-title>Thirteen Camellia chloroplast genome sequences determined by high-throughput sequencing : genome structure and phylogenetic relationships</article-title>. <source>BMC Evol. Biol.</source> <volume>14</volume>, <fpage>1</fpage>&#x02013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.1186/1471-2148-14-151</pub-id><pub-id pub-id-type="pmid">25001059</pub-id></citation>
</ref>
<ref id="B27">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>Y. Y.</given-names></name> <name><surname>Matzke</surname> <given-names>A. J. M.</given-names></name> <name><surname>Matzke</surname> <given-names>M.</given-names></name></person-group> (<year>2013</year>). <article-title>Complete sequence and comparative analysis of the chloroplast genome of coconut palm (<italic>Cocos nucifera</italic>)</article-title>. <source>PLoS ONE</source> <volume>8</volume>:<fpage>74736</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0074736</pub-id><pub-id pub-id-type="pmid">24023703</pub-id></citation>
</ref>
<ref id="B28">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Iannacone</surname> <given-names>R.</given-names></name> <name><surname>Grieco</surname> <given-names>P. D.</given-names></name> <name><surname>Cellini</surname> <given-names>F.</given-names></name></person-group> (<year>1997</year>). <article-title>Specific sequence modifications of a cry3B endotoxin gene result in high levels of expression and insect resistance</article-title>. <source>Plant Mol. Biol.</source> <volume>34</volume>, <fpage>485</fpage>&#x02013;<lpage>496</lpage>. <pub-id pub-id-type="doi">10.1023/A:1005876323398</pub-id><pub-id pub-id-type="pmid">9225859</pub-id></citation>
</ref>
<ref id="B29">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Inada</surname> <given-names>M.</given-names></name> <name><surname>Sasaki</surname> <given-names>T.</given-names></name> <name><surname>Yukawa</surname> <given-names>M.</given-names></name> <name><surname>Tsudzuki</surname> <given-names>T.</given-names></name> <name><surname>Sugiura</surname> <given-names>M.</given-names></name></person-group> (<year>2004</year>). <article-title>A systematic search for RNA editing sites in pea chloroplasts: an editing event causes diversification from the evolutionarily conserved amino acid sequence</article-title>. <source>Plant Cell Physiol.</source> <volume>45</volume>, <fpage>1615</fpage>&#x02013;<lpage>1622</lpage>. <pub-id pub-id-type="doi">10.1093/pcp/pch191</pub-id><pub-id pub-id-type="pmid">15574837</pub-id></citation>
</ref>
<ref id="B30">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jansen</surname> <given-names>R. K.</given-names></name> <name><surname>Cai</surname> <given-names>Z.</given-names></name> <name><surname>Raubeson</surname> <given-names>L. A.</given-names></name> <name><surname>Daniell</surname> <given-names>H.</given-names></name> <name><surname>Depamphilis</surname> <given-names>C. W.</given-names></name> <name><surname>Leebens-Mack</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2007</year>). <article-title>Analysis of 81 genes from 64 plastid genomes resolves relationships in angiosperms and identifies genome-scale evolutionary patterns</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>104</volume>, <fpage>19369</fpage>&#x02013;<lpage>19374</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0709121104</pub-id><pub-id pub-id-type="pmid">18048330</pub-id></citation>
</ref>
<ref id="B31">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jansen</surname> <given-names>R. K.</given-names></name> <name><surname>Palmer</surname> <given-names>J. D.</given-names></name></person-group> (<year>1987</year>). <article-title>A chloroplast DNA inversion marks an ancient evolutionary split in the sunflower family (Asteraceae)</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>84</volume>, <fpage>5818</fpage>&#x02013;<lpage>5822</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.84.16.5818</pub-id><pub-id pub-id-type="pmid">16593871</pub-id></citation>
</ref>
<ref id="B32">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jansen</surname> <given-names>R. K.</given-names></name> <name><surname>Wojciechowski</surname> <given-names>M. F.</given-names></name> <name><surname>Sanniyasi</surname> <given-names>E.</given-names></name> <name><surname>Lee</surname> <given-names>S. B.</given-names></name> <name><surname>Daniell</surname> <given-names>H.</given-names></name></person-group> (<year>2008</year>). <article-title>Complete plastid genome sequence of the chickpea (<italic>Cicer arietinum</italic>) and the phylogenetic distribution of rps12 and clpP intron losses among legumes (Leguminosae)</article-title>. <source>Mol. Phylogenet. Evol.</source> <volume>48</volume>, <fpage>1204</fpage>&#x02013;<lpage>1217</lpage>. <pub-id pub-id-type="doi">10.1016/j.ympev.2008.06.013</pub-id><pub-id pub-id-type="pmid">18638561</pub-id></citation>
</ref>
<ref id="B33">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kato</surname> <given-names>T.</given-names></name> <name><surname>Kaneko</surname> <given-names>T.</given-names></name> <name><surname>Sato</surname> <given-names>S.</given-names></name> <name><surname>Nakamura</surname> <given-names>Y.</given-names></name> <name><surname>Tabata</surname> <given-names>S.</given-names></name></person-group> (<year>2000</year>). <article-title>Complete structure of the chloroplast genome of a legume, <italic>Lotus japonicus</italic></article-title>. <source>DNA Res.</source> <volume>7</volume>, <fpage>323</fpage>&#x02013;<lpage>330</lpage>. <pub-id pub-id-type="doi">10.1093/dnares/7.6.323</pub-id><pub-id pub-id-type="pmid">11214967</pub-id></citation>
</ref>
<ref id="B34">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Khakhlova</surname> <given-names>O.</given-names></name> <name><surname>Bock</surname> <given-names>R.</given-names></name></person-group> (<year>2006</year>). <article-title>Elimination of deleterious mutations in plastid genomes by gene conversion</article-title>. <source>Plant J.</source> <volume>46</volume>, <fpage>85</fpage>&#x02013;<lpage>94</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-313X.2006.02673.x</pub-id><pub-id pub-id-type="pmid">16553897</pub-id></citation>
</ref>
<ref id="B35">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kirti</surname> <given-names>P. B.</given-names></name> <name><surname>Narasimhulu</surname> <given-names>S. B.</given-names></name> <name><surname>Mohapatra</surname> <given-names>T.</given-names></name> <name><surname>Prakash</surname> <given-names>S.</given-names></name> <name><surname>Chopra</surname> <given-names>V. L.</given-names></name></person-group> (<year>1993</year>). <article-title>Correction of chlorophyll deficiency in alloplasmic male sterile Brassica juncea through recombination between chloroplast genomes</article-title>. <source>Genet. Res., Camb.</source> <volume>62</volume>, <fpage>11</fpage>&#x02013;<lpage>14</lpage>. <pub-id pub-id-type="doi">10.1017/S0016672300031505</pub-id></citation>
</ref>
<ref id="B36">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Koch</surname> <given-names>W.</given-names></name> <name><surname>Edwards</surname> <given-names>K.</given-names></name> <name><surname>K&#x000F6;ssel</surname> <given-names>H.</given-names></name></person-group> (<year>1981</year>). <article-title>Sequencing of the 16S-23S spacer in a ribosomal RNA operon of Zea mays chloroplast DNA reveals two split tRNA genes</article-title>. <source>Cell</source> <volume>25</volume>, <fpage>203</fpage>&#x02013;<lpage>213</lpage>. <pub-id pub-id-type="doi">10.1016/0092-8674(81)90245-2</pub-id><pub-id pub-id-type="pmid">7023695</pub-id></citation>
</ref>
<ref id="B37">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lavin</surname> <given-names>M.</given-names></name> <name><surname>Doyle</surname> <given-names>J. J.</given-names></name> <name><surname>Palmer</surname> <given-names>J. D.</given-names></name></person-group> (<year>1990</year>). <article-title>Evolutionary significance of the loss of the Chloroplast-DNA inverted repeat in the leguminosae subfamily Papilionoideae</article-title>. <source>Evolution</source> <volume>44</volume>, <fpage>390</fpage>&#x02013;<lpage>402</lpage>. <pub-id pub-id-type="doi">10.2307/2409416</pub-id></citation>
</ref>
<ref id="B38">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>J.</given-names></name> <name><surname>Kang</surname> <given-names>Y.</given-names></name> <name><surname>Shin</surname> <given-names>S. C.</given-names></name> <name><surname>Park</surname> <given-names>H.</given-names></name> <name><surname>Lee</surname> <given-names>H.</given-names></name></person-group> (<year>2014</year>). <article-title>Combined analysis of the chloroplast genome and transcriptome of the antarctic vascular plant deschampsia antarctica desv</article-title>. <source>PLoS ONE</source> <volume>9</volume>:<fpage>e92501</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0092501</pub-id><pub-id pub-id-type="pmid">24647560</pub-id></citation>
</ref>
<ref id="B39">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Yang</surname> <given-names>Y.</given-names></name> <name><surname>Henry</surname> <given-names>R. J.</given-names></name> <name><surname>Rossetto</surname> <given-names>M.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Chen</surname> <given-names>S.</given-names></name></person-group> (<year>2015</year>). <article-title>Plant DNA barcoding: from gene to genome</article-title>. <source>Biol. Rev.</source> <volume>90</volume>, <fpage>157</fpage>&#x02013;<lpage>166</lpage>. <pub-id pub-id-type="doi">10.1111/brv.12104</pub-id><pub-id pub-id-type="pmid">24666563</pub-id></citation>
</ref>
<ref id="B40">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lin</surname> <given-names>C. P.</given-names></name> <name><surname>Ko</surname> <given-names>C. Y.</given-names></name> <name><surname>Kuo</surname> <given-names>C. I.</given-names></name> <name><surname>Liu</surname> <given-names>M. S.</given-names></name> <name><surname>Schafleitner</surname> <given-names>R.</given-names></name> <name><surname>Chen</surname> <given-names>L. F. O.</given-names></name></person-group> (<year>2015</year>). <article-title>Transcriptional slippage and RNA editing increase the diversity of transcripts in chloroplasts: insight from deep sequencing of <italic>Vigna radiata</italic> genome and transcriptome</article-title>. <source>PLoS ONE</source> <volume>10</volume>:<fpage>e129396</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0129396</pub-id><pub-id pub-id-type="pmid">26076132</pub-id></citation>
</ref>
<ref id="B41">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lowe</surname> <given-names>T. M.</given-names></name> <name><surname>Eddy</surname> <given-names>S. R.</given-names></name></person-group> (<year>1997</year>). <article-title>tRNAscan-SE: a program for improved detection of transfer RNA genes in genomic sequence</article-title>. <source>Nucleic Acids Res.</source> <volume>25</volume>, <fpage>955</fpage>&#x02013;<lpage>964</lpage>. <pub-id pub-id-type="doi">10.1093/nar/25.5.955</pub-id><pub-id pub-id-type="pmid">9023104</pub-id></citation>
</ref>
<ref id="B42">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lutz</surname> <given-names>K. A.</given-names></name> <name><surname>Maliga</surname> <given-names>P.</given-names></name></person-group> (<year>2001</year>). <article-title>Lack of conservation of editing sites in mRNAs that encode subunits of the NAD(P)H dehydrogenase complex in plastids and mitochondria of <italic>Arabidopsis thaliana</italic></article-title>. <source>Curr. Genet.</source> <volume>40</volume>, <fpage>214</fpage>&#x02013;<lpage>219</lpage>. <pub-id pub-id-type="doi">10.1007/s002940100242</pub-id><pub-id pub-id-type="pmid">11727998</pub-id></citation>
</ref>
<ref id="B43">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Magee</surname> <given-names>A. M.</given-names></name> <name><surname>Aspinall</surname> <given-names>S.</given-names></name> <name><surname>Rice</surname> <given-names>D. W.</given-names></name> <name><surname>Cusack</surname> <given-names>B. P.</given-names></name> <name><surname>S&#x000E9;mon</surname> <given-names>M.</given-names></name> <name><surname>Perry</surname> <given-names>A. S.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>Localized hypermutation and associated gene losses in legume chloroplast genomes</article-title>. <source>Genome Res.</source> <volume>20</volume>, <fpage>1700</fpage>&#x02013;<lpage>1710</lpage>. <pub-id pub-id-type="doi">10.1101/gr.111955.110</pub-id><pub-id pub-id-type="pmid">20978141</pub-id></citation>
</ref>
<ref id="B44">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maier</surname> <given-names>R. M.</given-names></name> <name><surname>Neckermann</surname> <given-names>K.</given-names></name> <name><surname>Igloi</surname> <given-names>G. L.</given-names></name> <name><surname>K&#x000F6;ssel</surname> <given-names>H.</given-names></name></person-group> (<year>1995</year>). <article-title>Complete sequence of the maize chloroplast genome: gene content, hotspots of divergence and fine tuning of genetic information by transcript editing</article-title>. <source>J. Mol. Biol.</source> <volume>251</volume>, <fpage>614</fpage>&#x02013;<lpage>628</lpage>. <pub-id pub-id-type="doi">10.1006/jmbi.1995.0460</pub-id><pub-id pub-id-type="pmid">7666415</pub-id></citation>
</ref>
<ref id="B45">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maier</surname> <given-names>R. M.</given-names></name> <name><surname>Zeltz</surname> <given-names>P.</given-names></name> <name><surname>K&#x000F6;ssel</surname> <given-names>H.</given-names></name> <name><surname>Bonnard</surname> <given-names>G.</given-names></name> <name><surname>Gualberto</surname> <given-names>J. M.</given-names></name> <name><surname>Grienenberger</surname> <given-names>J. M.</given-names></name></person-group> (<year>1996</year>). <article-title>RNA editing in plant mitochondria and chloroplasts</article-title>. <source>Plant Mol. Biol.</source> <volume>32</volume>, <fpage>343</fpage>&#x02013;<lpage>365</lpage>. <pub-id pub-id-type="doi">10.1007/BF00039390</pub-id><pub-id pub-id-type="pmid">8980487</pub-id></citation>
</ref>
<ref id="B46">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mariotti</surname> <given-names>R.</given-names></name> <name><surname>Cultrera</surname> <given-names>N. G. M.</given-names></name> <name><surname>D&#x000ED;ez</surname> <given-names>C. M.</given-names></name> <name><surname>Baldoni</surname> <given-names>L.</given-names></name> <name><surname>Rubini</surname> <given-names>A.</given-names></name></person-group> (<year>2010</year>). <article-title>Identification of new polymorphic regions and differentiation of cultivated olives (<italic>Olea europaea</italic> L.) through plastome sequence comparison</article-title>. <source>BMC Plant Biol.</source> <volume>10</volume>:<fpage>211</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2229-10-211</pub-id><pub-id pub-id-type="pmid">20868482</pub-id></citation>
</ref>
<ref id="B47">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Martin</surname> <given-names>G. E.</given-names></name> <name><surname>Rousseau-Gueutin</surname> <given-names>M.</given-names></name> <name><surname>Cordonnier</surname> <given-names>S.</given-names></name> <name><surname>Lima</surname> <given-names>O.</given-names></name> <name><surname>Michon-Coudouel</surname> <given-names>S.</given-names></name> <name><surname>Naquin</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>The first complete chloroplast genome of the Genistoid legume Lupinus luteus: evidence for a novel major lineage-specific rearrangement and new insights regarding plastome evolution in the legume family</article-title>. <source>Ann. Bot.</source> <volume>113</volume>, <fpage>1197</fpage>&#x02013;<lpage>1210</lpage>. <pub-id pub-id-type="doi">10.1093/aob/mcu050</pub-id><pub-id pub-id-type="pmid">24769537</pub-id></citation>
</ref>
<ref id="B48">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Millen</surname> <given-names>R. S.</given-names></name> <name><surname>Olmstead</surname> <given-names>R. G.</given-names></name> <name><surname>Adams</surname> <given-names>K. L.</given-names></name> <name><surname>Palmer</surname> <given-names>J. D.</given-names></name> <name><surname>Lao</surname> <given-names>N. T.</given-names></name> <name><surname>Heggie</surname> <given-names>L.</given-names></name> <etal/></person-group>. (<year>2001</year>). <article-title>Many parallel losses of infA from chloroplast DNA during Angiosperm evolution with multiple independent transfers to the nucleus</article-title>. <source>Plant Cell</source> <volume>13</volume>, <fpage>645</fpage>&#x02013;<lpage>658</lpage>. <pub-id pub-id-type="doi">10.1105/tpc.13.3.645</pub-id><pub-id pub-id-type="pmid">11251102</pub-id></citation>
</ref>
<ref id="B49">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moore</surname> <given-names>M. J.</given-names></name> <name><surname>Dhingra</surname> <given-names>A.</given-names></name> <name><surname>Soltis</surname> <given-names>P. S.</given-names></name> <name><surname>Shaw</surname> <given-names>R.</given-names></name> <name><surname>Farmerie</surname> <given-names>W. G.</given-names></name> <name><surname>Folta</surname> <given-names>K. M.</given-names></name> <etal/></person-group>. (<year>2006</year>). <article-title>Rapid and accurate pyrosequencing of angiosperm plastid genomes</article-title>. <source>BMC Plant Biol.</source> <volume>6</volume>:<fpage>17</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2229-6-17</pub-id><pub-id pub-id-type="pmid">16934154</pub-id></citation>
</ref>
<ref id="B50">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Morton</surname> <given-names>B. R.</given-names></name></person-group> (<year>2003</year>). <article-title>The role of context-dependent mutations in generating compositional and codon usage bias in grass chloroplast DNA</article-title>. <source>J. Mol. Evol.</source> <volume>56</volume>, <fpage>616</fpage>&#x02013;<lpage>629</lpage>. <pub-id pub-id-type="doi">10.1007/s00239-002-2430-1</pub-id><pub-id pub-id-type="pmid">12698298</pub-id></citation>
</ref>
<ref id="B51">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mower</surname> <given-names>J. P.</given-names></name></person-group> (<year>2009</year>). <article-title>The PREP suite: predictive RNA editors for plant mitochondrial genes, chloroplast genes and user-defined alignments</article-title>. <source>Nucleic Acids Res.</source> <volume>37</volume>, <fpage>W253</fpage>&#x02013;<lpage>W259</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkp337</pub-id><pub-id pub-id-type="pmid">19433507</pub-id></citation>
</ref>
<ref id="B52">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nagano</surname> <given-names>Y.</given-names></name> <name><surname>Matsuno</surname> <given-names>R.</given-names></name> <name><surname>Sasaki</surname> <given-names>Y.</given-names></name></person-group> (<year>1991</year>). <article-title>Sequence and transcriptional analysis of the gene cluster trnQ-zfpA-psaI-orf231-petA in pea chloroplasts</article-title>. <source>Curr. Genet.</source> <volume>20</volume>, <fpage>431</fpage>&#x02013;<lpage>436</lpage>. <pub-id pub-id-type="doi">10.1007/BF00317074</pub-id><pub-id pub-id-type="pmid">1807835</pub-id></citation>
</ref>
<ref id="B53">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ohyama</surname> <given-names>K.</given-names></name> <name><surname>Fukuzawa</surname> <given-names>H.</given-names></name> <name><surname>Kohchi</surname> <given-names>T.</given-names></name> <name><surname>Shirai</surname> <given-names>H.</given-names></name> <name><surname>Sano</surname> <given-names>T.</given-names></name> <name><surname>Sano</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>1986</year>). <article-title>Chloroplast gene organization deduced from complete sequence of liverwort <italic>Marchantia polymorpha</italic> chloroplast DNA</article-title>. <source>Nature</source> <volume>322</volume>, <fpage>572</fpage>&#x02013;<lpage>574</lpage>. <pub-id pub-id-type="doi">10.1038/322572a0</pub-id></citation>
</ref>
<ref id="B54">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Olmstead</surname> <given-names>R. G.</given-names></name> <name><surname>Palmer</surname> <given-names>J. D.</given-names></name></person-group> (<year>1994</year>). <article-title>Chloroplast DNA systematics : a review of methods and data analysis</article-title>. <source>Am. J. Bot.</source> <volume>81</volume>, <fpage>1205</fpage>&#x02013;<lpage>1224</lpage>. <pub-id pub-id-type="doi">10.2307/2445483</pub-id></citation>
</ref>
<ref id="B55">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ozyigit</surname> <given-names>I. I.</given-names></name> <name><surname>Dogan</surname> <given-names>I.</given-names></name> <name><surname>Filiz</surname> <given-names>E.</given-names></name></person-group> (<year>2015</year>). <article-title><italic>In silico</italic> analysis of simple sequence repeats (SSRs) in chloroplast genomes of Glycine species</article-title>. <source>Plant Omics J.</source> <volume>8</volume>, <fpage>24</fpage>&#x02013;<lpage>29</lpage>.</citation>
</ref>
<ref id="B56">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Palmer</surname> <given-names>J. D.</given-names></name></person-group> (<year>1983</year>). <article-title>Chloroplast DNA exists in two orientations</article-title>. <source>Nature</source> <volume>301</volume>, <fpage>92</fpage>&#x02013;<lpage>93</lpage>. <pub-id pub-id-type="doi">10.1038/301092a0</pub-id></citation>
</ref>
<ref id="B57">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Palmer</surname> <given-names>J. D.</given-names></name></person-group> (<year>1991</year>). <article-title>Plastid chromosomes: structure and evolution</article-title>, in <source>Molecular Biology of Plastids</source>, ed <person-group person-group-type="editor"><name><surname>Bogorad</surname> <given-names>L.</given-names></name></person-group>(<publisher-loc>San Diego, CA</publisher-loc>: <publisher-name>Academic Press</publisher-name>), <fpage>5</fpage>&#x02013;<lpage>53</lpage>.</citation>
</ref>
<ref id="B58">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Palmer</surname> <given-names>J. D.</given-names></name> <name><surname>Osorio</surname> <given-names>B.</given-names></name> <name><surname>Aldrich</surname> <given-names>J.</given-names></name> <name><surname>Thompson</surname> <given-names>W. F.</given-names></name></person-group> (<year>1987</year>). <article-title>Chloroplast DNA evolution among legumes: loss of a large inverted repeat occurred prior to other sequence rearrangements</article-title>. <source>Curr. Genet.</source> <volume>11</volume>, <fpage>275</fpage>&#x02013;<lpage>286</lpage>. <pub-id pub-id-type="doi">10.1007/BF00355401</pub-id></citation>
</ref>
<ref id="B59">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Palmer</surname> <given-names>J. D.</given-names></name> <name><surname>Osorio</surname> <given-names>B.</given-names></name> <name><surname>Thompson</surname> <given-names>W. F.</given-names></name></person-group> (<year>1988</year>). <article-title>Evolutionary significance of inversions in legume chloroplast DNAs</article-title>. <source>Curr. Genet.</source> <volume>14</volume>, <fpage>65</fpage>&#x02013;<lpage>74</lpage>. <pub-id pub-id-type="doi">10.1007/BF00405856</pub-id></citation>
</ref>
<ref id="B60">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Palmer</surname> <given-names>J. D.</given-names></name> <name><surname>Thompson</surname> <given-names>W. F.</given-names></name></person-group> (<year>1981</year>). <article-title>Rearrangements in the chloroplast genomes of mung bean and pea</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>78</volume>, <fpage>5533</fpage>&#x02013;<lpage>5537</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.78.9.5533</pub-id><pub-id pub-id-type="pmid">16593087</pub-id></citation>
</ref>
<ref id="B61">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Palmer</surname> <given-names>J. D.</given-names></name> <name><surname>Thompson</surname> <given-names>W. F.</given-names></name></person-group> (<year>1982</year>). <article-title>Chloroplast DNA rearrangements are more frequent when a large inverted repeat sequence is lost</article-title>. <source>Cell</source> <volume>29</volume>, <fpage>537</fpage>&#x02013;<lpage>550</lpage>. <pub-id pub-id-type="doi">10.1016/0092-8674(82)90170-2</pub-id><pub-id pub-id-type="pmid">6288261</pub-id></citation>
</ref>
<ref id="B62">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pennington</surname> <given-names>R.</given-names></name> <name><surname>Lavin</surname> <given-names>M.</given-names></name> <name><surname>Ireland</surname> <given-names>H.</given-names></name> <name><surname>Klitgaard</surname> <given-names>B.</given-names></name> <name><surname>Preston</surname> <given-names>J.</given-names></name> <name><surname>Hu</surname> <given-names>J.-M.</given-names></name></person-group> (<year>2001</year>). <article-title>Phylogenetic relationships of basal Papilionoid legumes based upon sequences of the chloroplast trnL intron</article-title>. <source>Syst. Bot.</source> <volume>26</volume>, <fpage>537</fpage>&#x02013;<lpage>556</lpage>. <pub-id pub-id-type="doi">10.1043/0363-6445-26.3.537</pub-id></citation>
</ref>
<ref id="B63">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Perry</surname> <given-names>A. S.</given-names></name> <name><surname>Wolfe</surname> <given-names>K. H.</given-names></name></person-group> (<year>2002</year>). <article-title>Nucleotide substitution rates in legume chloroplast DNA depend on the presence of the inverted repeat</article-title>. <source>J. Mol. Evol.</source> <volume>55</volume>, <fpage>501</fpage>&#x02013;<lpage>508</lpage>. <pub-id pub-id-type="doi">10.1007/s00239-002-2333-y</pub-id><pub-id pub-id-type="pmid">12399924</pub-id></citation>
</ref>
<ref id="B64">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Powell</surname> <given-names>W.</given-names></name> <name><surname>Morgante</surname> <given-names>M.</given-names></name> <name><surname>McDevitt</surname> <given-names>R.</given-names></name> <name><surname>Vendramin</surname> <given-names>G. G.</given-names></name> <name><surname>Rafalski</surname> <given-names>J. A.</given-names></name></person-group> (<year>1995</year>). <article-title>Polymorphic simple sequence repeat regions in chloroplast genomes: applications to the population genetics of pines</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>92</volume>, <fpage>7759</fpage>&#x02013;<lpage>7763</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.92.17.7759</pub-id><pub-id pub-id-type="pmid">7644491</pub-id></citation>
</ref>
<ref id="B65">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Provan</surname> <given-names>J.</given-names></name> <name><surname>Powell</surname> <given-names>W.</given-names></name> <name><surname>Hollingsworth</surname> <given-names>P. M.</given-names></name></person-group> (<year>2001</year>). <article-title>Chloroplast microsatellites: new tools for studies in plant ecology and evolution</article-title>. <source>Trends Ecol. Evol.</source> <volume>16</volume>, <fpage>142</fpage>&#x02013;<lpage>147</lpage>. <pub-id pub-id-type="doi">10.1016/S0169-5347(00)02097-8</pub-id><pub-id pub-id-type="pmid">11179578</pub-id></citation>
</ref>
<ref id="B66">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rajendrakumar</surname> <given-names>P.</given-names></name> <name><surname>Biswal</surname> <given-names>A. K.</given-names></name> <name><surname>Balachandran</surname> <given-names>S. M.</given-names></name> <name><surname>Srinivasarao</surname> <given-names>K.</given-names></name> <name><surname>Sundaram</surname> <given-names>R. M.</given-names></name></person-group> (<year>2007</year>). <article-title>Simple sequence repeats in organellar genomes of rice: frequency and distribution in genic and intergenic regions</article-title>. <source>Bioinformatics</source> <volume>23</volume>, <fpage>1</fpage>&#x02013;<lpage>4</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btl547</pub-id><pub-id pub-id-type="pmid">17077096</pub-id></citation>
</ref>
<ref id="B67">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Raman</surname> <given-names>G.</given-names></name> <name><surname>Park</surname> <given-names>S.</given-names></name></person-group> (<year>2015</year>). <article-title>Analysis of the complete chloroplast genome of a medicinal plant, Dianthus superbus var. longicalyncinus, from a comparative genomics perspective</article-title>. <source>PLoS ONE</source> <volume>10</volume>:<fpage>e141329</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0141329</pub-id><pub-id pub-id-type="pmid">26513163</pub-id></citation>
</ref>
<ref id="B68">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Raubeson</surname> <given-names>L. A.</given-names></name> <name><surname>Jansen</surname> <given-names>R. K.</given-names></name></person-group> (<year>2005</year>). <article-title>Chloroplast genomes of plants</article-title>, in <source>Plant Diversity and Evolution: Genotypic and Phenotypic Variation in Higher Plants,</source> ed. R. J. Henry (<publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>CABI</publisher-name>), <fpage>45</fpage>&#x02013;<lpage>68</lpage>.</citation>
</ref>
<ref id="B69">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Raubeson</surname> <given-names>L. A.</given-names></name> <name><surname>Jansen</surname> <given-names>R. K.</given-names></name></person-group> (<year>1992</year>). <article-title>Chloroplast DNA evidence on the ancient evolutionary split in vascular land plants</article-title>. <source>Science</source> <volume>255</volume>, <fpage>1697</fpage>&#x02013;<lpage>1699</lpage>. <pub-id pub-id-type="doi">10.1126/science.255.5052.1697</pub-id><pub-id pub-id-type="pmid">17749424</pub-id></citation>
</ref>
<ref id="B70">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Redwan</surname> <given-names>R. M.</given-names></name> <name><surname>Saidin</surname> <given-names>A.</given-names></name> <name><surname>Kumar</surname> <given-names>S. V.</given-names></name></person-group> (<year>2015</year>). <article-title>Complete chloroplast genome sequence of MD-2 pineapple and its comparative analysis among nine other plants from the subclass Commelinidae</article-title>. <source>BMC Plant Biol.</source> <volume>15</volume>:<fpage>196</fpage>. <pub-id pub-id-type="doi">10.1186/s12870-015-0587-1</pub-id><pub-id pub-id-type="pmid">26683477</pub-id></citation>
</ref>
<ref id="B71">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rouwendal</surname> <given-names>G. J. A.</given-names></name> <name><surname>Mendes</surname> <given-names>O.</given-names></name> <name><surname>Wolbert</surname> <given-names>E. J. H.</given-names></name> <name><surname>de Boer</surname> <given-names>A. D.</given-names></name></person-group> (<year>1997</year>). <article-title>Enhanced expression in tobacco of the gene encoding green fluorescent protein by modification of its codon usage</article-title>. <source>Plant Mol. Biol.</source> <volume>33</volume>, <fpage>989</fpage>&#x02013;<lpage>999</lpage>. <pub-id pub-id-type="doi">10.1023/A:1005740823703</pub-id><pub-id pub-id-type="pmid">9154981</pub-id></citation>
</ref>
<ref id="B72">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sabir</surname> <given-names>J.</given-names></name> <name><surname>Schwarz</surname> <given-names>E.</given-names></name> <name><surname>Ellison</surname> <given-names>N.</given-names></name> <name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Baeshen</surname> <given-names>N. A.</given-names></name> <name><surname>Mutwakil</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Evolutionary and biotechnology implications of plastid genome variation in the inverted-repeat-lacking clade of legumes</article-title>. <source>Plant Biotechnol. J.</source> <volume>12</volume>, <fpage>743</fpage>&#x02013;<lpage>754</lpage>. <pub-id pub-id-type="doi">10.1111/pbi.12179</pub-id><pub-id pub-id-type="pmid">24618204</pub-id></citation>
</ref>
<ref id="B73">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Saski</surname> <given-names>C.</given-names></name> <name><surname>Lee</surname> <given-names>S. B.</given-names></name> <name><surname>Daniell</surname> <given-names>H.</given-names></name> <name><surname>Wood</surname> <given-names>T. C.</given-names></name> <name><surname>Tomkins</surname> <given-names>J.</given-names></name> <name><surname>Kim</surname> <given-names>H. G.</given-names></name> <etal/></person-group>. (<year>2005</year>). <article-title>Complete chloroplast genome sequence of <italic>Glycine max</italic> and comparative analyses with other legume genomes</article-title>. <source>Plant Mol. Biol.</source> <volume>59</volume>, <fpage>309</fpage>&#x02013;<lpage>322</lpage>. <pub-id pub-id-type="doi">10.1007/s11103-005-8882-0</pub-id><pub-id pub-id-type="pmid">16247559</pub-id></citation>
</ref>
<ref id="B74">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sato</surname> <given-names>S.</given-names></name> <name><surname>Nakamura</surname> <given-names>Y.</given-names></name> <name><surname>Kaneko</surname> <given-names>T.</given-names></name> <name><surname>Asamizu</surname> <given-names>E.</given-names></name> <name><surname>Tabata</surname> <given-names>S.</given-names></name></person-group> (<year>1999</year>). <article-title>Complete structure of the chloroplast genome of thaliana ssc</article-title>. <source>DNA Res.</source> <volume>6</volume>, <fpage>283</fpage>&#x02013;<lpage>290</lpage>. <pub-id pub-id-type="doi">10.1093/dnares/6.5.283</pub-id><pub-id pub-id-type="pmid">10574454</pub-id></citation>
</ref>
<ref id="B75">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schl&#x000F6;tterer</surname> <given-names>C.</given-names></name></person-group> (<year>2000</year>). <article-title>Evolutionary dynamics of microsatellite DNA</article-title>. <source>Chromosoma</source> <volume>109</volume>, <fpage>365</fpage>&#x02013;<lpage>371</lpage>. <pub-id pub-id-type="doi">10.1007/s004120000089</pub-id><pub-id pub-id-type="pmid">11072791</pub-id></citation>
</ref>
<ref id="B76">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schmieder</surname> <given-names>R.</given-names></name> <name><surname>Edwards</surname> <given-names>R.</given-names></name></person-group> (<year>2011</year>). <article-title>Quality control and preprocessing of metagenomic datasets</article-title>. <source>Bioinformatics</source> <volume>27</volume>, <fpage>863</fpage>&#x02013;<lpage>864</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btr026</pub-id><pub-id pub-id-type="pmid">21278185</pub-id></citation>
</ref>
<ref id="B77">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Sharma</surname> <given-names>D.</given-names></name> <name><surname>Green</surname> <given-names>J. M.</given-names></name></person-group> (<year>1980</year>). <article-title>Pigeonpea</article-title>, in <source>Hybridization of Crop Plants</source>, eds <person-group person-group-type="editor"><name><surname>Fehr</surname> <given-names>W. R.</given-names></name> <name><surname>Hadley</surname> <given-names>H. H.</given-names></name></person-group>(<publisher-loc>Madison, WI</publisher-loc>: <publisher-name>American Society of Agronomy and Crop Science Society of America</publisher-name>), <fpage>471</fpage>&#x02013;<lpage>481</lpage>.</citation>
</ref>
<ref id="B78">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shikanai</surname> <given-names>T.</given-names></name> <name><surname>Endo</surname> <given-names>T.</given-names></name> <name><surname>Hashimoto</surname> <given-names>T.</given-names></name> <name><surname>Yamada</surname> <given-names>Y.</given-names></name> <name><surname>Asada</surname> <given-names>K.</given-names></name> <name><surname>Yokota</surname> <given-names>A.</given-names></name></person-group> (<year>1998</year>). <article-title>Directed disruption of the tobacco ndhB gene impairs cyclic electron flow around photosystem I</article-title>. <source>Proc. Natl. Acad. Sci. U. S.A.</source> <volume>95</volume>, <fpage>9705</fpage>&#x02013;<lpage>9709</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.95.16.9705</pub-id><pub-id pub-id-type="pmid">9689145</pub-id></citation>
</ref>
<ref id="B79">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shinozaki</surname> <given-names>K.</given-names></name> <name><surname>Ohme</surname> <given-names>M.</given-names></name> <name><surname>Tanaka</surname> <given-names>M.</given-names></name> <name><surname>Wakasugi</surname> <given-names>T.</given-names></name> <name><surname>Hayashida</surname> <given-names>N.</given-names></name> <name><surname>Matsubayashi</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>1986</year>). <article-title>The complete nucleotide sequence of the tobacco chloroplast genome: its gene organization and expression</article-title>. <source>EMBO J.</source> <volume>5</volume>, <fpage>2043</fpage>&#x02013;<lpage>2049</lpage>. <pub-id pub-id-type="pmid">16453699</pub-id></citation>
</ref>
<ref id="B80">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Singh</surname> <given-names>N. K.</given-names></name> <name><surname>Gupta</surname> <given-names>D. K.</given-names></name> <name><surname>Jayaswal</surname> <given-names>P. K.</given-names></name> <name><surname>Mahato</surname> <given-names>A. K.</given-names></name> <name><surname>Dutta</surname> <given-names>S.</given-names></name> <name><surname>Singh</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2012</year>). <article-title>The first draft of the pigeonpea genome sequence</article-title>. <source>J. Plant Biochem. Biotechnol.</source> <volume>21</volume>, <fpage>98</fpage>&#x02013;<lpage>112</lpage>. <pub-id pub-id-type="doi">10.1007/s13562-011-0088-8</pub-id><pub-id pub-id-type="pmid">24431589</pub-id></citation>
</ref>
<ref id="B81">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Smith</surname> <given-names>A. G.</given-names></name> <name><surname>Wilson</surname> <given-names>R. M.</given-names></name> <name><surname>Kaethner</surname> <given-names>T. M.</given-names></name> <name><surname>Willey</surname> <given-names>D. L.</given-names></name> <name><surname>Gray</surname> <given-names>J. C.</given-names></name></person-group> (<year>1991</year>). <article-title>Pea chloroplast genes encoding a 4kDa polypeptide of photosystem I and a putative enzyme of C1 metabolism</article-title>. <source>Curr. Genet.</source> <volume>19</volume>, <fpage>403</fpage>&#x02013;<lpage>410</lpage>. <pub-id pub-id-type="doi">10.1007/BF00309603</pub-id><pub-id pub-id-type="pmid">1913879</pub-id></citation>
</ref>
<ref id="B82">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tangphatsornruang</surname> <given-names>S.</given-names></name> <name><surname>Sangsrakru</surname> <given-names>D.</given-names></name> <name><surname>Chanprasert</surname> <given-names>J.</given-names></name> <name><surname>Uthaipaisanwong</surname> <given-names>P.</given-names></name> <name><surname>Yoocha</surname> <given-names>T.</given-names></name> <name><surname>Jomchai</surname> <given-names>N.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>The chloroplast genome sequence of mungbean (<italic>Vigna radiata</italic>) determined by high-throughput pyrosequencing: structural organization and phylogenetic relationships</article-title>. <source>DNA Res.</source> <volume>17</volume>, <fpage>11</fpage>&#x02013;<lpage>22</lpage>. <pub-id pub-id-type="doi">10.1093/dnares/dsp025</pub-id><pub-id pub-id-type="pmid">20007682</pub-id></citation>
</ref>
<ref id="B83">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Thomas</surname> <given-names>F.</given-names></name> <name><surname>Massenet</surname> <given-names>O.</given-names></name> <name><surname>Dorne</surname> <given-names>A. M.</given-names></name> <name><surname>Briat</surname> <given-names>J. M. R.</given-names></name></person-group> (<year>1988</year>). <article-title>Expression of the rpl23, rpl2, and rps19 genes in spinach chloroplasts</article-title>. <source>Nucleic Acids Res.</source> <volume>16</volume>, <fpage>2461</fpage>&#x02013;<lpage>2472</lpage>. <pub-id pub-id-type="doi">10.1093/nar/16.6.2461</pub-id><pub-id pub-id-type="pmid">3362671</pub-id></citation>
</ref>
<ref id="B84">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tsudzuki</surname> <given-names>J.</given-names></name> <name><surname>Ito</surname> <given-names>S.</given-names></name> <name><surname>Tsudzuki</surname> <given-names>T.</given-names></name> <name><surname>Wakasugi</surname> <given-names>T.</given-names></name> <name><surname>Sugiura</surname> <given-names>M.</given-names></name></person-group> (<year>1994</year>). <article-title>A new gene encoding tRNA (Pro) (GGG) is present in the chloroplast genome of black pine: a compilation of 32 tRNA genes from black pine chloroplasts</article-title>. <source>Curr Genet.</source> <volume>26</volume>, <fpage>153</fpage>&#x02013;<lpage>158</lpage>. <pub-id pub-id-type="doi">10.1007/BF00313804</pub-id><pub-id pub-id-type="pmid">8001170</pub-id></citation>
</ref>
<ref id="B85">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tuteja</surname> <given-names>R.</given-names></name> <name><surname>Saxena</surname> <given-names>R. K.</given-names></name> <name><surname>Davila</surname> <given-names>J.</given-names></name> <name><surname>Shah</surname> <given-names>T.</given-names></name> <name><surname>Chen</surname> <given-names>W.</given-names></name> <name><surname>Xiao</surname> <given-names>Y. L.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>Cytoplasmic male sterility-associated chimeric open reading frames identified by mitochondrial genome sequencing of four cajanus genotypes</article-title>. <source>DNA Res.</source> <volume>20</volume>, <fpage>485</fpage>&#x02013;<lpage>495</lpage>. <pub-id pub-id-type="doi">10.1093/dnares/dst025</pub-id><pub-id pub-id-type="pmid">23792890</pub-id></citation>
</ref>
<ref id="B86">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ueda</surname> <given-names>M.</given-names></name> <name><surname>Nishikawa</surname> <given-names>T.</given-names></name> <name><surname>Fujimoto</surname> <given-names>M.</given-names></name> <name><surname>Takanashi</surname> <given-names>H.</given-names></name> <name><surname>Arimura</surname> <given-names>S. I.</given-names></name> <name><surname>Tsutsumi</surname> <given-names>N.</given-names></name> <etal/></person-group>. (<year>2008</year>). <article-title>Substitution of the gene for chloroplast RPS16 was assisted by generation of a dual targeting signal</article-title>. <source>Mol. Biol. Evol.</source> <volume>25</volume>, <fpage>1566</fpage>&#x02013;<lpage>1575</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msn102</pub-id><pub-id pub-id-type="pmid">18453549</pub-id></citation>
</ref>
<ref id="B87">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Varshney</surname> <given-names>R. K.</given-names></name> <name><surname>Chen</surname> <given-names>W.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Bharti</surname> <given-names>A. K.</given-names></name> <name><surname>Saxena</surname> <given-names>R. K.</given-names></name> <name><surname>Schlueter</surname> <given-names>J. A.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Draft genome sequence of pigeonpea (<italic>Cajanus cajan</italic>), an orphan legume crop of resource-poor farmers</article-title>. <source>Nat. Biotechnol.</source> <volume>30</volume>, <fpage>83</fpage>&#x02013;<lpage>89</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.2022</pub-id><pub-id pub-id-type="pmid">22057054</pub-id></citation>
</ref>
<ref id="B88">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wakasugi</surname> <given-names>T.</given-names></name> <name><surname>Nagai</surname> <given-names>T.</given-names></name> <name><surname>Kapoor</surname> <given-names>M.</given-names></name> <name><surname>Sugita</surname> <given-names>M.</given-names></name> <name><surname>Ito</surname> <given-names>M.</given-names></name> <name><surname>Ito</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>1997</year>). <article-title>Complete nucleotide sequence of the chloroplast genome from the green alga <italic>Chlorella vulgaris</italic>: the existence of genes possibly involved in chloroplast division</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>94</volume>, <fpage>5967</fpage>&#x02013;<lpage>5972</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.94.11.5967</pub-id><pub-id pub-id-type="pmid">9159184</pub-id></citation>
</ref>
<ref id="B89">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wheeler</surname> <given-names>G. L.</given-names></name> <name><surname>Dorman</surname> <given-names>H. E.</given-names></name> <name><surname>Buchanan</surname> <given-names>A.</given-names></name> <name><surname>Challagundla</surname> <given-names>L.</given-names></name> <name><surname>Wallace</surname> <given-names>L. E.</given-names></name></person-group> (<year>2014</year>). <article-title>A review of the prevalence, utility, and caveats of using chloroplast simple sequence repeats for studies of plant biology</article-title>. <source>Appl. Plant Sci.</source> <volume>2</volume>:<fpage>1400059</fpage>. <pub-id pub-id-type="doi">10.3732/apps.1400059</pub-id><pub-id pub-id-type="pmid">25506520</pub-id></citation>
</ref>
<ref id="B90">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Williams</surname> <given-names>A. V.</given-names></name> <name><surname>Boykin</surname> <given-names>L. M.</given-names></name> <name><surname>Howell</surname> <given-names>K. A.</given-names></name> <name><surname>Nevill</surname> <given-names>P. G.</given-names></name> <name><surname>Small</surname> <given-names>I.</given-names></name></person-group> (<year>2015</year>). <article-title>The complete sequence of the <italic>Acacia ligulata</italic> chloroplast genome reveals a highly divergent clpP1 gene</article-title>. <source>PLoS ONE</source> <volume>10</volume>:<fpage>e0125768</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0125768</pub-id><pub-id pub-id-type="pmid">26367530</pub-id></citation>
</ref>
<ref id="B91">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wojciechowski</surname> <given-names>M. F.</given-names></name> <name><surname>Lavin</surname> <given-names>M.</given-names></name> <name><surname>Sanderson</surname> <given-names>M. J.</given-names></name></person-group> (<year>2004</year>). <article-title>A phylogeny of legumes (Leguminosae) based on analysis of the plastid matK gene resolves many well-supported subclades within the family</article-title>. <source>Am. J. Bot.</source> <volume>91</volume>, <fpage>1846</fpage>&#x02013;<lpage>1862</lpage>. <pub-id pub-id-type="doi">10.3732/ajb.91.11.1846</pub-id><pub-id pub-id-type="pmid">21652332</pub-id></citation>
</ref>
<ref id="B92">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wojciechowski</surname> <given-names>M. F.</given-names></name> <name><surname>Sanderson</surname> <given-names>M. J.</given-names></name> <name><surname>Steele</surname> <given-names>K. P.</given-names></name> <name><surname>Liston</surname> <given-names>A.</given-names></name></person-group> (<year>2000</year>). <article-title>Molecular phylogeny of the &#x0201C;Temperate Herbaceous Tribes&#x0201D; of papilionoid legumes: a supertree approach</article-title>. <source>Adv. Legum. Syst.</source> <volume>9</volume>, <fpage>277</fpage>&#x02013;<lpage>298</lpage>.</citation>
</ref>
<ref id="B93">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wolfe</surname> <given-names>K. H.</given-names></name> <name><surname>Morden</surname> <given-names>C. W.</given-names></name> <name><surname>Palmer</surname> <given-names>J. D.</given-names></name></person-group> (<year>1992</year>). <article-title>Function and evolution of a minimal plastid genome from a nonphotosynthetic parasitic plant</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>89</volume>, <fpage>10648</fpage>&#x02013;<lpage>10652</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.89.22.10648</pub-id><pub-id pub-id-type="pmid">1332054</pub-id></citation>
</ref>
<ref id="B94">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wyman</surname> <given-names>S. K.</given-names></name> <name><surname>Jansen</surname> <given-names>R. K.</given-names></name> <name><surname>Boore</surname> <given-names>J. L.</given-names></name></person-group> (<year>2004</year>). <article-title>Automatic annotation of organellar genomes with DOGMA</article-title>. <source>Bioinformatics</source> <volume>20</volume>, <fpage>3252</fpage>&#x02013;<lpage>3255</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bth352</pub-id><pub-id pub-id-type="pmid">15180927</pub-id></citation>
</ref>
<ref id="B95">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>J.</given-names></name> <name><surname>Feng</surname> <given-names>D.</given-names></name> <name><surname>Song</surname> <given-names>G.</given-names></name> <name><surname>Wei</surname> <given-names>X.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Wu</surname> <given-names>X.</given-names></name> <etal/></person-group>. (<year>2003</year>). <article-title>The first intron of rice EPSP synthase enhances expression of foreign gene</article-title>. <source>Sci. China C Life Sci.</source> <volume>46</volume>, <fpage>561</fpage>&#x02013;<lpage>569</lpage>. <pub-id pub-id-type="doi">10.1360/02yc0120</pub-id><pub-id pub-id-type="pmid">18758713</pub-id></citation>
</ref>
<ref id="B96">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yan</surname> <given-names>L.</given-names></name> <name><surname>Lai</surname> <given-names>X.</given-names></name> <name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Wei</surname> <given-names>C.</given-names></name> <name><surname>Tan</surname> <given-names>X.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name></person-group> (<year>2015</year>). <article-title>Analyses of the complete genome and gene expression of chloroplast of sweet potato [<italic>Ipomoea batata</italic>]</article-title>. <source>PLoS ONE</source> <volume>10</volume>:<fpage>e124083</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0124083</pub-id><pub-id pub-id-type="pmid">25874767</pub-id></citation>
</ref>
<ref id="B97">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>Y.</given-names></name> <name><surname>Dang</surname> <given-names>Y.</given-names></name> <name><surname>Li</surname> <given-names>Q.</given-names></name> <name><surname>Lu</surname> <given-names>J.</given-names></name> <name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name></person-group> (<year>2014</year>). <article-title>Complete chloroplast genome sequence of poisonous and medicinal plant datura stramonium: organizations and implications for genetic engineering</article-title>. <source>PLoS ONE</source> <volume>9</volume>:<fpage>e110656</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0110656</pub-id><pub-id pub-id-type="pmid">25365514</pub-id></citation>
</ref>
<ref id="B98">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yao</surname> <given-names>X.</given-names></name> <name><surname>Tang</surname> <given-names>P.</given-names></name> <name><surname>Li</surname> <given-names>Z.</given-names></name> <name><surname>Li</surname> <given-names>D.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name> <name><surname>Huang</surname> <given-names>H.</given-names></name></person-group> (<year>2015</year>). <article-title>The first complete chloroplast genome sequences in actinidiaceae: genome structure and comparative analysis</article-title>. <source>PLoS ONE</source> <volume>10</volume>:<fpage>e0129347</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0129347</pub-id><pub-id pub-id-type="pmid">26046631</pub-id></citation>
</ref>
<ref id="B99">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yi</surname> <given-names>D.</given-names></name> <name><surname>Kim</surname> <given-names>K.</given-names></name></person-group> (<year>2012</year>). <article-title>Complete chloroplast genome sequences of important oilseed crop <italic>Sesamum indicum</italic> L</article-title>. <source>PLoS ONE</source> <volume>7</volume>:<fpage>e35872</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0035872</pub-id><pub-id pub-id-type="pmid">22606240</pub-id></citation>
</ref>
<ref id="B100">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Young</surname> <given-names>N. D.</given-names></name> <name><surname>Debell&#x000E9;</surname> <given-names>F.</given-names></name> <name><surname>Oldroyd</surname> <given-names>G. E. D.</given-names></name> <name><surname>Geurts</surname> <given-names>R.</given-names></name> <name><surname>Cannon</surname> <given-names>S. B.</given-names></name> <name><surname>Udvardi</surname> <given-names>M. K.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>The Medicago genome provides insight into the evolution of rhizobial symbioses</article-title>. <source>Nature</source> <volume>480</volume>, <fpage>520</fpage>&#x02013;<lpage>524</lpage>. <pub-id pub-id-type="doi">10.1038/nature10625</pub-id><pub-id pub-id-type="pmid">22089132</pub-id></citation>
</ref>
</ref-list>
<fn-group>
<fn id="fn0001"><p><sup>1</sup><ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/genome/browse/">https://www.ncbi.nlm.nih.gov/genome/browse/</ext-link></p></fn>
<fn id="fn0002"><p><sup>2</sup><ext-link ext-link-type="uri" xlink:href="http://www.bioinformatics.babraham.ac.uk/projects/fastqc">http://www.bioinformatics.babraham.ac.uk/projects/fastqc</ext-link></p></fn>
<fn id="fn0003"><p><sup>3</sup><ext-link ext-link-type="uri" xlink:href="http://www.currentprotocols.com/WileyCDA/CurPro3Tool/toolId-7.html">http://www.currentprotocols.com/WileyCDA/CurPro3Tool/toolId-7.html</ext-link></p></fn>
<fn id="fn0004"><p><sup>4</sup><ext-link ext-link-type="uri" xlink:href="http://prep.unl.edu/">http://prep.unl.edu/</ext-link></p></fn>
<fn id="fn0005"><p><sup>5</sup><ext-link ext-link-type="uri" xlink:href="http://pgrc.ipk-gatersleben.de/misa/">http://pgrc.ipk-gatersleben.de/misa/</ext-link></p></fn>
</fn-group>
</back>
</article>