<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">867736</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2022.867736</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Repetitive Elements, Sequence Turnover and Cyto-Nuclear Gene Transfer in Gymnosperm Mitogenomes</article-title>
<alt-title alt-title-type="left-running-head">Liu et al.</alt-title>
<alt-title alt-title-type="right-running-head">Gymnosperm Mitogenomes</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Hui</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1498628/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zhao</surname>
<given-names>Wei</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1600687/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Ren-Gang</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Mao</surname>
<given-names>Jian-Feng</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/355122/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Xiao-Ru</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1660669/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>National Engineering Laboratory for Tree Breeding</institution>, <institution>Key Laboratory of Genetics and Breeding in Forest Trees and Ornamental Plants</institution>, <institution>Ministry of Education</institution>, <institution>The Tree and Ornamental Plant Breeding and Biotechnology Laboratory of National Forestry and Grassland Administration</institution>, <institution>College of Biological Sciences and Technology</institution>, <institution>Beijing Forestry University</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Ecology and Environmental Science</institution>, <institution>Ume&#xe5; Plant Science Centre</institution>, <institution>Ume&#xe5; University</institution>, <addr-line>Ume&#xe5;</addr-line>, <country>Sweden</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Bioinformatics</institution>, <institution>Ori (Shandong) Gene Science and Technology Co., Ltd.</institution>, <addr-line>Weifang</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/182524/overview">Jinhui Chen</ext-link>, Nanjing Forestry University, China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/243192/overview">Peng-Fei Ma</ext-link>, Kunming Institute of Botany (CAS), China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1494299/overview">Jia-Yu Xue</ext-link>, Nanjing Agricultural University, China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Wei Zhao, <email>zhao.wei@umu.se</email>
</corresp>
<fn fn-type="equal" id="fn1">
<label>
<sup>&#x2020;</sup>
</label>
<p>These authors have contributed equally to this work</p>
</fn>
<fn fn-type="other">
<p>This article was submitted to Evolutionary and Population Genetics, a section of the journal Frontiers in Genetics</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>25</day>
<month>05</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>13</volume>
<elocation-id>867736</elocation-id>
<history>
<date date-type="received">
<day>01</day>
<month>02</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>28</day>
<month>04</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Liu, Zhao, Zhang, Mao and Wang.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Liu, Zhao, Zhang, Mao and Wang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Among the three genomes in plant cells, the mitochondrial genome (mitogenome) is the least studied due to complex recombination and intergenomic transfer. In gymnosperms only &#x223c;20 mitogenomes have been released thus far, which hinders a systematic investigation into the tempo and mode of mitochondrial DNA evolution in seed plants. Here, we report the complete mitogenome sequence of <italic>Platycladus orientalis</italic> (Cupressaceae). This mitogenome is assembled as two circular-mapping chromosomes with a size of &#x223c;2.6&#xa0;Mb and which contains 32 protein-coding genes, three rRNA and seven tRNA genes, and 1,068 RNA editing sites. Repetitive sequences, including dispersed repeats, transposable elements (TEs), and tandem repeats, made up 23% of the genome. Comparative analyses with 17 other mitogenomes representing the five gymnosperm lineages revealed a 30-fold difference in genome size, 80-fold in repetitive content, and 230-fold in substitution rate. We found dispersed repeats are highly associated with mitogenome expansion (<italic>r</italic> &#x3d; 0.99), and most of them were accumulated during recent duplication events. Syntenic blocks and shared sequences between mitogenomes decay rapidly with divergence time (<italic>r</italic> &#x3d; 0.53), with the exceptions of Ginkgo and Cycads which retained conserved genome structure over long evolutionary time. Our phylogenetic analysis supports a sister group relationship of Cupressophytes and Gnetophytes; both groups are unique in that they lost 8&#x2013;12 protein-coding genes, of which 4&#x2013;7 intact genes are likely transferred to nucleus. These two clades also show accelerated and highly variable substitution rates relative to other gymnosperms. Our study highlights the dynamic and enigmatic evolution of gymnosperm mitogenomes.</p>
</abstract>
<kwd-group>
<kwd>
<italic>Platycladus orientalis</italic>
</kwd>
<kwd>gene transfer</kwd>
<kwd>gymnosperm mitogenome</kwd>
<kwd>rearrangement</kwd>
<kwd>repetitive sequences</kwd>
<kwd>substitution rate</kwd>
<kwd>sequence turnover</kwd>
<kwd>RNA editing</kwd>
</kwd-group>
<contract-sponsor id="cn001">National Natural Science Foundation of China<named-content content-type="fundref-id">10.13039/501100001809</named-content>
</contract-sponsor>
<contract-sponsor id="cn002">Vetenskapsr&#xe5;det<named-content content-type="fundref-id">10.13039/501100004359</named-content>
</contract-sponsor>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>In contrast to the &#x223c;8,600 chloroplast (<ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>) and &#x223c;800 nuclear reference genomes assembled (<xref ref-type="bibr" rid="B31">Marks et al., 2021</xref>) for land plant taxa thus far, only &#x223c;350 mitogenomes have been released (<ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>; by November 2021). These published plant mitogenomes revealed extensive diversity in genome size, genome rearrangement, nucleotide substitution rate, and gene contents (<xref ref-type="bibr" rid="B39">Palmer and Herbon, 1988</xref>; <xref ref-type="bibr" rid="B2">Chaw et al., 2008</xref>; <xref ref-type="bibr" rid="B52">Smith and Keeling, 2015</xref>; <xref ref-type="bibr" rid="B35">Mower, 2020</xref>; <xref ref-type="bibr" rid="B61">Wu et al., 2020</xref>). In angiosperms, mitogenomes span a 170-fold range in size, from &#x223c;66&#xa0;Kb in <italic>Viscum scurruloideum</italic> to &#x223c;11.3&#xa0;Mb in <italic>Silene conica</italic> (<xref ref-type="bibr" rid="B49">Sloan et al., 2012</xref>; <xref ref-type="bibr" rid="B47">Skippington et al., 2015</xref>). The mechanisms contributing to the size variation are hypothesized to include horizontal transfer, intergenomic transfer, and repetitive sequence proliferation (<xref ref-type="bibr" rid="B12">Goremykin et al., 2012</xref>; <xref ref-type="bibr" rid="B43">Rice et al., 2013</xref>; <xref ref-type="bibr" rid="B16">Guo et al., 2017</xref>). For example, the mitogenome of the basal angiosperm <italic>Amborella trichopoda</italic> acquired &#x223c;20% of its sequences through horizontal transfer from green algae, mosses, and other plants (<xref ref-type="bibr" rid="B43">Rice et al., 2013</xref>), while apple and maize acquired 20&#x2013;78% of mitochondrial DNA (mtDNA) from their nuclei (<xref ref-type="bibr" rid="B12">Goremykin et al., 2012</xref>). The repeat content in 82 angiosperm mitogenomes ranged from 1.3% to 48.9% (<xref ref-type="bibr" rid="B9">Dong et al., 2018</xref>). A phylogenetic pattern in these traits is, however, not yet discernable.</p>
<p>Plant mitogenomes are often characterized by a strong dichotomy between rates of sequence and structural evolution (<xref ref-type="bibr" rid="B39">Palmer and Herbon, 1988</xref>). Analyses of the available mitogenomes show that while most plant lineages have low substitution rates, it is misleading to categorize all plants in this way; synonymous substitution rates are exceptionally variable, with four orders of magnitude across seed plants (<xref ref-type="bibr" rid="B34">Mower et al., 2007</xref>). The reason for such fluid substitution rates remains unclear.</p>
<p>Gymnosperms contain &#x223c;1,000 species representing five of the six main lineages of seed plants, including Cupressophytes, Pinaceae, Gnetophytes, Ginkgo, and Cycads (<xref ref-type="bibr" rid="B58">Wang and Ran, 2014</xref>). Up to now, only &#x223c;20 gymnosperm mitogenomes have been released, which are too few to allow a proper understanding of the properties and diversities of this genome. Despite the limited data, interesting and sometimes unexpected patterns of mtDNA variation have emerged. Similar to angiosperms, gymnosperm mitogenomes also show a wide range in size, with <italic>Ginkgo biloba</italic> (&#x223c;347&#xa0;Kb) and <italic>Larix sibirica</italic> (&#x223c;11.7&#xa0;Mb) being the extremes (<xref ref-type="bibr" rid="B14">Guo et al., 2016</xref>; <xref ref-type="bibr" rid="B41">Putintseva et al., 2020</xref>). The driving factors for this size heterogeneity are, however, debated because estimations of repetitive contents and nucleus-derived sequences vary among studies (<xref ref-type="bibr" rid="B14">Guo et al., 2016</xref>; <xref ref-type="bibr" rid="B21">Kan et al., 2020</xref>; <xref ref-type="bibr" rid="B54">Sullivan et al., 2020</xref>).</p>
<p>Fast structural rearrangement of gymnosperm mitogenomes is reported to result in a substantial loss of synteny and shared sequences between closely related species with divergence times as small as 15 million years ago (MYA) (<xref ref-type="bibr" rid="B14">Guo et al., 2016</xref>; <xref ref-type="bibr" rid="B5">Cole et al., 2018</xref>; <xref ref-type="bibr" rid="B54">Sullivan et al., 2020</xref>). On the other hand, conserved structures and high degrees of synteny are found between <italic>Cycas</italic> and <italic>Ginkgo</italic> that diversified &#x3e;300 MYA (<xref ref-type="bibr" rid="B14">Guo et al., 2016</xref>). Parallel to this unpredictable structural diversity are the highly variable substitution rates among the taxa (<xref ref-type="bibr" rid="B14">Guo et al., 2016</xref>; <xref ref-type="bibr" rid="B54">Sullivan et al., 2020</xref>; <xref ref-type="bibr" rid="B22">Kan et al., 2021</xref>). In addition, the number of protein-coding and other genes vary between gymnosperm lineages (<xref ref-type="bibr" rid="B15">Guo et al., 2020</xref>; <xref ref-type="bibr" rid="B22">Kan et al., 2021</xref>). These observations show a largely lineage-specific mode of mitogenome evolution in gymnosperms, but the mechanisms and phylogenetic patterns for this diversity are unclear due to sparse sampling and limited analyses.</p>
<p>In this study, we report a complete mitogenome assembly of <italic>Platycladus orientalis</italic>, Cupressaceae (Cupressophytes). Cupressaceae is the largest conifer family with 25 genera; <italic>Platycladus</italic> is a monotypic genus in this family. This new genome thus fills a gap in the still sparse coverage for this clade. We then sampled 17 gymnosperm and two angiosperm mitogenomes, representing all six major lineages of seed plants, to characterize gene content, transposable elements (TEs), dispersed repeats, tandem repeats, sequence turnover, structural rearrangement and substitution rate variation. We provide quantitative estimates of the role of repetitive elements in genome expansion, the mode of repeats accumulation, and the rate of synteny decay among taxa. Our results reinforce some early observations but also shed new light on the dynamics of mitogenome evolution.</p>
</sec>
<sec id="s2">
<title>2 Materials and Methods</title>
<sec id="s2-1">
<title>2.1 Mitochondrial Genome Assembly and Annotation</title>
<p>We collected fresh young leaves of <italic>P. orientalis</italic> from an elite tree in a seed orchard in Jiaxian, Henan Province, China. DNA used for Illumina sequencing was isolated using a cetyl trimethyl ammonium bromide (CTAB)-based method (<xref ref-type="bibr" rid="B10">Doyle and Doyle, 1987</xref>). For the Oxford Nanopore Technologies (ONT) sequencing, we prepared DNA using a DNeasy Plant Mini Kit (QIAGEN). A short-insert 2 &#xd7; 150&#xa0;bp pair-end library was constructed following the manufacturer&#x2019;s PCR-free protocol (Illumina) and sequenced on an Illumina NovaSeq 6000 platform. Library for ONT sequencing was prepared following the Nanopore 1D Genomic DNA by ligation (SQK-LSK109)&#x2013;PromethION protocol, and sequenced on a PromethION platform. The short reads from Illumina were filtered using fastp v0.21.0 (<xref ref-type="bibr" rid="B3">Chen et al., 2018</xref>) with parameters of &#x201c;-q 20 -l 36 --cut_right --n_base_limit 0 -c.&#x201d; The long reads from Nanopore were corrected using NextDenovo v1.1.0 (<ext-link ext-link-type="uri" xlink:href="https://github.com/Nextomics/NextDenovo">https://github.com/Nextomics/NextDenovo</ext-link>). We generated &#x223c;110&#xa0;Gb Illumina clean short reads and &#x223c;808&#xa0;Gb (40.3&#xa0;M reads with a N50 of 25&#xa0;Kb) corrected ONT long reads.</p>
<p>We applied a long and short reads hybrid strategy to assemble the <italic>P. orientalis</italic> mitogenome. First, the clean short reads were <italic>de novo</italic> assembled using GetOrganelle v1.6.4 (<xref ref-type="bibr" rid="B19">Jin et al., 2020</xref>) with parameters of &#x201c;-R 50 -k 67,87,107,127 -F embplant_mt --reduce-reads-for-coverage inf -w 127 -t 12 --max-reads 7.5E8&#x201d;. The resulting unitig graph was manually edited using Bandage v0.8.1 (<xref ref-type="bibr" rid="B60">Wick et al., 2015</xref>) to remove chloroplast- and nuclear-derived unitig nodes. The corrected long reads were then mapped to the graph using the minimap2 v2.24-r1122 (<xref ref-type="bibr" rid="B27">Li, 2018</xref>). Finally, repeats on the graph were resolved by aligning with the mapped long reads.</p>
<p>The protein-coding genes, non-coding rRNA, and tRNA genes were annotated using the Organelle Genome Annotation Pipeline (OGAP, <ext-link ext-link-type="uri" xlink:href="https://github.com/zhangrengang/OGAP">https://github.com/zhangrengang/OGAP</ext-link>) with parameters of &#x201c;-taxon Acrogymnospermae Bryophyta Liliopsida commelinids fabids malvids -mt -trn_struct&#x201d;. More specifically, protein-coding genes were identified with Exonerate v2.2.0 (<xref ref-type="bibr" rid="B48">Slater and Birney, 2005</xref>) and AUGUSTUS v3.3.3 (<xref ref-type="bibr" rid="B53">Stanke et al., 2008</xref>), tRNA genes with tRNAscan-SE v2.0.5 (<xref ref-type="bibr" rid="B29">Lowe and Eddy, 1997</xref>), and rRNA genes with BLAT v36x2 (<xref ref-type="bibr" rid="B23">Kent, 2002</xref>) within the OGAP.</p>
<p>RNA editing sites in protein-coding genes of each species were predicted using the PREP-Mt (<xref ref-type="bibr" rid="B33">Mower, 2005</xref>) with a cutoff of 0.2. To validate the accuracy of the predictions, we searched for RNAseq data of <italic>P. orientalis</italic> (<xref ref-type="sec" rid="s11">Supplementary Table S1</xref>) and mapped them to the protein-coding genes with bwa mem v0.7.17-r1188 (<xref ref-type="bibr" rid="B26">Li, 2013</xref>) to determine the edited sites using REDItoolDenovo v1.3 (<xref ref-type="bibr" rid="B28">Lo Giudice et al., 2020</xref>) with minimum coverage of 10 and mapping quality score of 30.</p>
</sec>
<sec id="s2-2">
<title>2.2 Repetitive Sequences</title>
<p>To estimate the repetitive sequences in mitogenomes, we annotated tandem repeats, TEs, and dispersed repeats in <italic>P. orientalis</italic> and 19 other taxa representing the six major lineages of seed plants included in this study (<xref ref-type="table" rid="T1">Table 1</xref>). Tandem repeats were identified using Tandem Repeats Finder v4.10.0 with the parameters of &#x201c;2 7 7 80 10 50 800 -d&#x201d; (<xref ref-type="bibr" rid="B1">Benson, 1999</xref>). For TEs, we first used the <italic>de novo</italic> TE family identification and modeling package RepeatModeler v1.0.10 (<xref ref-type="bibr" rid="B51">Smit and Hubley, 2008</xref>) to train a TE database from each mitogenome. The RepeatModeler derived library was then combined with the database &#x201c;RepeatMasker.lib&#x201d; of RepeatMasker v4.07 (<xref ref-type="bibr" rid="B50">Smit et al., 2013</xref>) and the repeat library of <italic>Picea abies</italic> v1.0 assembly (<xref ref-type="bibr" rid="B38">Nystedt et al., 2013</xref>) to generate a joint repeats library. Finally, TEs in each genome were identified by RepeatMasker using this reference database.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Summary of the 20 plant mitogenomes.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Lineage</th>
<th align="center">Species</th>
<th align="center">Genome size (Kb)</th>
<th align="center">No. scaffolds</th>
<th align="center">GC (%)</th>
<th align="center">Accession number</th>
<th align="center">References</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Cupressophytes</td>
<td align="left">
<italic>Platycladus orientalis</italic>
</td>
<td align="center">2,624</td>
<td align="char" char=".">2</td>
<td align="char" char=".">50.60</td>
<td align="center">OL703044-45</td>
<td align="left">This study</td>
</tr>
<tr>
<td align="left">Cupressophytes</td>
<td align="left">
<italic>Cupressus sempervirens</italic>
</td>
<td align="center">2,743</td>
<td align="char" char=".">238</td>
<td align="char" char=".">50.64</td>
<td align="center">MN965161-90</td>
<td align="left">
<xref ref-type="bibr" rid="B15">Guo et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">Cupressophytes</td>
<td align="left">
<italic>Hesperocyparis glabra</italic>
</td>
<td align="center">1,967</td>
<td align="char" char=".">129</td>
<td align="char" char=".">50.02</td>
<td align="center">MN965210-41</td>
<td align="left">
<xref ref-type="bibr" rid="B15">Guo et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">Cupressophytes</td>
<td align="left">
<italic>Taxus cuspidata</italic>
</td>
<td align="center">469</td>
<td align="char" char=".">1</td>
<td align="char" char=".">50.39</td>
<td align="center">MN593023</td>
<td align="left">
<xref ref-type="bibr" rid="B21">Kan et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">Cupressophytes</td>
<td align="left">
<italic>Podocarpus macrophyllus</italic>
</td>
<td align="center">2,021</td>
<td align="char" char=".">85</td>
<td align="char" char=".">47.44</td>
<td align="center">MN965338-58</td>
<td align="left">
<xref ref-type="bibr" rid="B15">Guo et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">Cupressophytes</td>
<td align="left">
<italic>Araucaria heterophylla</italic>
</td>
<td align="center">1,384</td>
<td align="char" char=".">52</td>
<td align="char" char=".">46.80</td>
<td align="center">MN965108-21</td>
<td align="left">
<xref ref-type="bibr" rid="B15">Guo et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">Gnetophytes</td>
<td align="left">
<italic>Gnetum gnemon</italic>
</td>
<td align="center">640</td>
<td align="char" char=".">44</td>
<td align="char" char=".">47.88</td>
<td align="center">MN965191-209</td>
<td align="left">
<xref ref-type="bibr" rid="B15">Guo et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">Gnetophytes</td>
<td align="left">
<italic>Welwitschia mirabilis</italic>
</td>
<td align="center">979</td>
<td align="char" char=".">1</td>
<td align="char" char=".">53.02</td>
<td align="center">NC_029130</td>
<td align="left">
<xref ref-type="bibr" rid="B14">Guo et al. (2016)</xref>
</td>
</tr>
<tr>
<td align="left">Pinaceae</td>
<td align="left">
<italic>Picea abies</italic>
</td>
<td align="center">4,899</td>
<td align="char" char=".">4</td>
<td align="char" char=".">44.67</td>
<td align="center">MN642623-626</td>
<td align="left">
<xref ref-type="bibr" rid="B54">Sullivan et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">Pinaceae</td>
<td align="left">
<italic>Picea glauca</italic>
</td>
<td align="center">5,995</td>
<td align="char" char=".">36</td>
<td align="char" char=".">44.67</td>
<td align="center">LKAM00000000</td>
<td align="left">
<xref ref-type="bibr" rid="B18">Jackman et al. (2015)</xref>
</td>
</tr>
<tr>
<td align="left">Pinaceae</td>
<td align="left">
<italic>Pinus lambertiana</italic>
</td>
<td align="center">4,021</td>
<td align="char" char=".">262</td>
<td align="char" char=".">44.91</td>
<td align="center">NA</td>
<td align="left">
<xref ref-type="bibr" rid="B59">Wegrzyn et al. (2008)</xref>
</td>
</tr>
<tr>
<td align="left">Pinaceae</td>
<td align="left">
<italic>Pinus taeda</italic>
</td>
<td align="center">1,191</td>
<td align="char" char=".">1</td>
<td align="char" char=".">46.67</td>
<td align="center">NC_039746</td>
<td align="left">NA</td>
</tr>
<tr>
<td align="left">Pinaceae</td>
<td align="left">
<italic>Larix sibirica</italic>
</td>
<td align="center">11,663</td>
<td align="char" char=".">9</td>
<td align="char" char=".">41.90</td>
<td align="center">MT797187-95</td>
<td align="left">
<xref ref-type="bibr" rid="B41">Putintseva et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">Pinaceae</td>
<td align="left">
<italic>Abies sibirica</italic>
</td>
<td align="center">1,485</td>
<td align="char" char=".">237</td>
<td align="char" char=".">45.73</td>
<td align="center">MN965088-107</td>
<td align="left">
<xref ref-type="bibr" rid="B15">Guo et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">Ginkgo</td>
<td align="left">
<italic>Ginkgo biloba</italic>
</td>
<td align="center">347</td>
<td align="char" char=".">1</td>
<td align="char" char=".">50.36</td>
<td align="center">NC_027976</td>
<td align="left">
<xref ref-type="bibr" rid="B14">Guo et al. (2016)</xref>
</td>
</tr>
<tr>
<td align="left">Cycads</td>
<td align="left">
<italic>Ceratozamia hildae</italic>
</td>
<td align="center">412</td>
<td align="char" char=".">85</td>
<td align="char" char=".">47.54</td>
<td align="center">MN965122-60</td>
<td align="left">
<xref ref-type="bibr" rid="B15">Guo et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">Cycads</td>
<td align="left">
<italic>Zamia integrifolia</italic>
</td>
<td align="center">469</td>
<td align="char" char=".">96</td>
<td align="char" char=".">47.59</td>
<td align="center">MN965050-87</td>
<td align="left">
<xref ref-type="bibr" rid="B15">Guo et al. (2020)</xref>
</td>
</tr>
<tr>
<td align="left">Cycads</td>
<td align="left">
<italic>Cycas taitungensis</italic>
</td>
<td align="center">415</td>
<td align="char" char=".">1</td>
<td align="char" char=".">46.92</td>
<td align="center">NC_010303</td>
<td align="left">
<xref ref-type="bibr" rid="B2">Chaw et al. (2008)</xref>
</td>
</tr>
<tr>
<td align="left">Angiosperm</td>
<td align="left">
<italic>Amborella trichopoda</italic>
</td>
<td align="center">3,866</td>
<td align="char" char=".">5</td>
<td align="char" char=".">45.92</td>
<td align="center">KF754799-803</td>
<td align="left">
<xref ref-type="bibr" rid="B43">Rice et al. (2013)</xref>
</td>
</tr>
<tr>
<td align="left">Angiosperm</td>
<td align="left">
<italic>Liriodendron tulipifera</italic>
</td>
<td align="center">554</td>
<td align="char" char=".">1</td>
<td align="char" char=".">47.70</td>
<td align="center">KC821969</td>
<td align="left">
<xref ref-type="bibr" rid="B44">Richardson et al. (2013)</xref>
</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Dispersed repeats were identified with a BLASTN search using a word size of seven and an e-value of 1<italic>E</italic>-6 as in a previous study (<xref ref-type="bibr" rid="B14">Guo et al., 2016</xref>). Overlapping regions of dispersed repeats were counted only once when calculating their total size. The dispersed repeats were grouped into small-, medium-, and large-size classes with sequence lengths of &#x3c;100 bp, 100&#x2013;1,000 bp, and &#x2265;1,000 bp, respectively. Divergence among repeats was estimated using Kimura two-parameter distance (K2P) (<xref ref-type="bibr" rid="B24">Kimura, 1980</xref>) for pairwise repeat sequences.</p>
</sec>
<sec id="s2-3">
<title>2.3 Identify Mitochondrial Genes From Transcriptomes</title>
<p>Based on gene annotation results, we found 8&#x2013;12 genes were absent in mitogenomes of Cupressophytes and Gnetophytes (see <xref ref-type="sec" rid="s3-3">Section 3.3</xref>). To investigate the possibility of their transfer to nuclei, we first tried to recover these genes from transcriptomes. We searched for RNAseq data of Cupressophytes and Gnetophytes in NCBI (<ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>), and <italic>de novo</italic> assembled transcriptomes for <italic>Cupressus sempervirens</italic>, <italic>Hesperocyparis glabra</italic>, <italic>Taxus cuspidata</italic>, <italic>Podocarpus macrophyllus</italic>, <italic>Gnetum gnemon</italic>, and <italic>Welwitschia mirabilis</italic> (<xref ref-type="sec" rid="s11">Supplementary Table S2</xref>)<italic>.</italic> The Illumina reads were filtered using fastp v0.21.0 (<xref ref-type="bibr" rid="B3">Chen et al., 2018</xref>) with the parameters of &#x201c;-q 20 -l 36 --cut_right --n_base_limit 0 -c,&#x201d; generating 6.3&#x2013;14.7&#xa0;Gb clean reads per species. We then <italic>de novo</italic> assembled the transcriptomes using Trinity v2.8.5 with default parameters (<xref ref-type="bibr" rid="B13">Grabherr et al., 2011</xref>). The transcriptome of <italic>P. orientalis</italic> is from our early study (<xref ref-type="bibr" rid="B17">Hu et al., 2016</xref>). For <italic>Araucaria heterophylla</italic>, we only found 212 ESTs/cDNAs in TreeGenes database (<xref ref-type="bibr" rid="B59">Wegrzyn et al., 2008</xref>) (<xref ref-type="sec" rid="s11">Supplementary Table S2</xref>). We searched for intact mitochondrial genes in these transcriptomes and ESTs/cDNAs using OGAP with the parameters of &#x201c;-taxon Acrogymnospermae Bryophyta Liliopsida commelinids fabids malvids -mt -trn_struct -trans&#x201d;. Potential chloroplast genes were filtered out after BLAST against NCBI&#x2019;s NT database (<italic>E</italic>-value &#x3c; 1<italic>E</italic>-40, sequence coverage &#x3e;99%, and sequence identity &#x3e;99%).</p>
<p>Second, to confirm that the transcriptome-recovered mitochondrial genes (mitogenes) were in nuclear genomes, we used TBLASTN to search for matches of these genes in reference genomes of Cupressophytes and Gnetophytes, including <italic>Sequoiadendron giganteum</italic> (<xref ref-type="bibr" rid="B46">Scott et al., 2020</xref>), <italic>Sequoia sempervirens</italic> (<xref ref-type="bibr" rid="B36">Neale et al., 2021</xref>), <italic>Taxus chinensis</italic> (<xref ref-type="bibr" rid="B63">Xiong et al., 2021</xref>), <italic>Taxus wallichiana</italic> (<xref ref-type="bibr" rid="B4">Cheng et al., 2021</xref>), <italic>Gnetum montanum</italic> (<xref ref-type="bibr" rid="B56">Wan et al., 2018</xref>), and <italic>Welwitschia mirabilis</italic> (<xref ref-type="bibr" rid="B57">Wan et al., 2021</xref>) (<xref ref-type="sec" rid="s11">Supplementary Table S3</xref>).</p>
<p>Third, we used mapping depth of reads of resequencing data to verify the genome origins of the transcriptome-recovered mitogenes. In a plant cell, the abundance of nuclear and organelle genomes can differ by thousands fold with the copy numbers of plastid the highest, mitochondrial intermediate and nuclear the lowest (<xref ref-type="bibr" rid="B40">Petit and Vendramin, 2007</xref>). Based on this expectation, we investigated the depth of read coverage of each recovered genes. The mitochondrial genes retrieved from mitogenome and transcriptomes were used as reference. We also include the low-copy nuclear gene <italic>LEAFY</italic> and chloroplast gene <italic>matK</italic> as spike-in reference. We downloaded whole-genome resequencing data of <italic>Cupressus sempervirens</italic>, <italic>Hesperocyparis glabra</italic>, <italic>Taxus cuspidata</italic>, <italic>Podocarpus macrophyllus</italic>, <italic>Gnetum gnemon</italic>, and <italic>Welwitschia mirabilis</italic> from Sequence Read Archive (SRA) of NCBI (<ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/sra">https://www.ncbi.nlm.nih.gov/sra</ext-link>) (<xref ref-type="sec" rid="s11">Supplementary Table S4</xref>), the resequencing data of <italic>P. orientalis</italic> is from this study. The Illumina reads were filtered using fastp v0.21.0 (<xref ref-type="bibr" rid="B3">Chen et al., 2018</xref>) with the same parameters as in <xref ref-type="sec" rid="s2-1">Section 2.1</xref>, generating 7.2&#x2013;31.4&#xa0;Gb clean reads per species. The clean reads were mapped to the reference genes using bwa mem v0.7.17-r1188 with default parameters. The resulting sequence alignment maps (SAMs) were sorted with SAMtools v1.14 (<ext-link ext-link-type="uri" xlink:href="https://github.com/samtools/samtools">https://github.com/samtools/samtools</ext-link>), reads with alignment score (AS) &#x3c;25 were removed by using ngsutilsj (<ext-link ext-link-type="uri" xlink:href="https://github.com/compgen-io/ngsutilsj">https://github.com/compgen-io/ngsutilsj</ext-link>). We used SAMtools to compute the depth of the aligned reads at each position of the gene.</p>
</sec>
<sec id="s2-4">
<title>2.4 Genome Alignments and Shared DNA Blocks</title>
<p>To identify synteny blocks among the mitogenomes of the major gymnosperm lineages, we performed pairwise genome alignment using Mauve v2.4.0 with default parameters (<xref ref-type="bibr" rid="B7">Darling et al., 2010</xref>). To calculate the degree of shared DNA between species, each pair of mitogenomes were aligned using BLASTN with a word size of seven and an <italic>E</italic>-value of 1<italic>E</italic>-6.</p>
</sec>
<sec id="s2-5">
<title>2.5 Phylogenetic Analysis and Estimation of Nucleotide Substitution Rates</title>
<p>We used 28 protein-coding genes shared among all 20 mitogenomes included in this study to reconstruct a phylogenetic tree. Edited protein sequences were individually aligned with MAFFT v7.453 with default parameters and converted into the corresponding edited codon sequence alignments. Poorly aligned regions were trimmed using BMGE v1.1 (<xref ref-type="bibr" rid="B6">Criscuolo and Gribaldo, 2010</xref>) with parameters of &#x201c;-t CODON -g 0.5.&#x201d; The trimmed alignments of each gene were concatenated into a single alignment of 26,844&#xa0;bp. This alignment was used to build a maximum-likelihood (ML) phylogenetic tree using IQ-TREE v1.6.12 (<xref ref-type="bibr" rid="B37">Nguyen et al., 2015</xref>), using the best-fit model TVM &#x2b; F &#x2b; R3 selected by ModelFinder (<xref ref-type="bibr" rid="B20">Kalyaanamoorthy et al., 2017</xref>) and with 1,000 replications of ultrafast bootstrap and Shimodaira-Hasegawa-like approximate likelihood-ratio (SH-aLRT) test. The branch lengths in units of synonymous (d<italic>S</italic>) and nonsynonymous (d<italic>N</italic>) substitution rates were estimated under the free-ratio branch model using codeml in PAML v4.9j package (<xref ref-type="bibr" rid="B64">Yang, 2007</xref>).</p>
<p>To estimate the divergence time between lineages, we run the MCMCTree in PAML v4.9j (<xref ref-type="bibr" rid="B64">Yang, 2007</xref>) for 2,000,000 iterations and 100,000 iterations for a burn-in. To calibrate the tree, we used the following time points of diversification from the TimeTree web (<ext-link ext-link-type="uri" xlink:href="http://www.timetree.org/">http://www.timetree.org/</ext-link>): 289&#x2013;337 MYA between gymnosperms and angiosperms, 282&#x2013;324 MYA between Cycads and other gymnosperm clades, 159&#x2013;246 MYA between <italic>Cycas taitungensis</italic> and the other Cycads species, 134&#x2013;197 MYA between <italic>Abies sibirica</italic> and other species within Pinaceae, 7.6 to 30.7 MYA between <italic>Picea abies</italic> and <italic>Picea glauca</italic>, 59&#x2013;87 MYA between <italic>Pinus taeda</italic> and <italic>Pinus lambertiana</italic>, 99&#x2013;123 MYA between <italic>Gnetum gnemon</italic> and <italic>Welwitschia mirabilis</italic>, and 213&#x2013;272 MYA between the clades consisting of <italic>Podocarpus macrophyllus</italic> and <italic>Araucaria heterophylla</italic> and the other species of Cupressophytes.</p>
</sec>
</sec>
<sec id="s3">
<title>3 Results</title>
<sec id="s3-1">
<title>3.1 The Mitogenome of <italic>P. orientalis</italic>
</title>
<p>We assembled the mitogenome of <italic>P. orientalis</italic> into two circular-mapping chromosomes representing a master ring and a sub-genomic ring with a total size of &#x223c;2.6&#xa0;Mb (<xref ref-type="fig" rid="F1">Figure 1A</xref>, <xref ref-type="table" rid="T2">Table 2</xref>). This genome lacks large structural variants but is rich in dispersed repeats (<xref ref-type="fig" rid="F1">Figures 1B,C</xref>). The genome size is similar to <italic>C. sempervirens</italic> (2.7&#xa0;Mb) and <italic>H. glabra</italic> (2.0&#xa0;Mb) in the family of Cupressaceae, but more than 5-fold larger than <italic>T. cuspidata</italic> and &#x223c;2&#x2013;4 fold smaller than <italic>Picea</italic> and <italic>Larix</italic> in Pinaceae (<xref ref-type="table" rid="T1">Table 1</xref>). Across the Cupressophytes and Pinaceae, the mitogenomes vary 6&#x2013;10 fold in size, in contrast to the relatively stable and small genomes in Cycads and Gnetophytes.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>The mitogenome assembly of <italic>Platycladus orientalis.</italic> <bold>(A)</bold> The order, orientation, and size of genes on the two chromosomes of <italic>P. orientalis</italic> mitogenome. The <italic>nad1</italic>, <italic>nad2</italic>, <italic>nad4</italic>, <italic>nad5</italic>, and <italic>cox2</italic> are <italic>trans</italic>-splicing genes. Each box is proportional to the size of the gene including introns; genes with &#x3c;200 nucleotides are shown as 200 nucleotides. Intergenic regions are not to scale. <bold>(B)</bold> The dot plot shows self-alignment. Dots represent the homology sequences with length &#x3e;100&#xa0;bp. <bold>(C)</bold> Distribution of dispersed repeats. Large-size repeats &#x2265;1,000&#xa0;bp in length are indicated in red, medium-size repeats in the range of 100&#x2013;1,000&#xa0;bp are in orange, and small-size repeats &#x3c;100&#xa0;bp are in blue. The numbers on the ring anchor genome coordinates in kilobases.</p>
</caption>
<graphic xlink:href="fgene-13-867736-g001.tif"/>
</fig>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Characteristics of the <italic>Platycladus orientalis</italic> mitogenome.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Feature</th>
<th align="center">Values</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Genome size</td>
<td align="center">2,624&#xa0;Kb</td>
</tr>
<tr>
<td align="left">GC content</td>
<td align="center">50.6%</td>
</tr>
<tr>
<td align="left">Protein-coding genes</td>
<td align="center">32 (41&#xa0;Kb)</td>
</tr>
<tr>
<td align="left">
<italic>cis</italic>-spliced introns</td>
<td align="center">5</td>
</tr>
<tr>
<td align="left">
<italic>trans-</italic>spliced introns</td>
<td align="center">10</td>
</tr>
<tr>
<td align="left">Predicted RNA editing sites</td>
<td align="center">1,007</td>
</tr>
<tr>
<td align="left">Observed RNA editing sites</td>
<td align="center">1,068</td>
</tr>
<tr>
<td align="left">tRNAs</td>
<td align="center">7</td>
</tr>
<tr>
<td align="left">rRNAs</td>
<td align="center">3</td>
</tr>
<tr>
<td align="left">Chloroplast genes</td>
<td align="center">9 (6&#xa0;Kb)</td>
</tr>
<tr>
<td align="left">Repetitive sequences</td>
<td align="center">608&#xa0;Kb (23.2%)</td>
</tr>
<tr>
<td align="left">Tandem repeats</td>
<td align="center">123&#xa0;Kb (4.7%)</td>
</tr>
<tr>
<td align="left">Transposable elements (TEs)</td>
<td align="center">157&#xa0;Kb (6.0%)</td>
</tr>
<tr>
<td align="left">Dispersed repeats</td>
<td align="center">541&#xa0;Kb (20.6%)</td>
</tr>
<tr>
<td align="left">Undefined sequences</td>
<td align="center">1,983&#xa0;Kb (75.6%)</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The mitogenome of <italic>P. orientalis</italic> contains 32 distinct protein-coding genes (<xref ref-type="fig" rid="F1">Figure 1A</xref>, <xref ref-type="table" rid="T2">Table 2</xref>), seven tRNA genes (<italic>Asp-trnD-GUC</italic>, <italic>Glu-trnE-UUC</italic>, <italic>Ile-trnI-CAU</italic>, <italic>Met-trnM-CAU</italic>, <italic>Met-trnfM-CAU</italic>, <italic>Trp-trnW-CCA</italic>, and <italic>Tyr-trnY-GUA</italic>), and three rRNA genes. Among them, <italic>ccmFC</italic> and <italic>cox1</italic> have four copies, <italic>rrn5</italic>, <italic>rrn18</italic>, and <italic>rrn26</italic> have three copies, <italic>nad1</italic>, <italic>trnD-GUC</italic>, <italic>trnE-UUC</italic>, <italic>trnM-CAU</italic>, and <italic>trnfM-CAU</italic> have two copies. We found five <italic>cis</italic>-spliced introns and 10 <italic>trans</italic>-spliced introns in the protein-coding genes (<xref ref-type="sec" rid="s11">Supplementary Table S5</xref>). Both the number of protein-coding genes (<xref ref-type="fig" rid="F2">Figure 2B</xref>) and the number of <italic>cis</italic>- and <italic>trans</italic>-spliced introns identified in <italic>P. orientalis</italic> are similar to that of Cupressophytes taxa reported previously (<xref ref-type="bibr" rid="B15">Guo et al., 2020</xref>). We also detected seven complete chloroplast genes (although they may not be functional), <italic>atpA</italic>, <italic>ndhA</italic>, <italic>ndhB</italic>, <italic>ndhC</italic>, <italic>ndhD</italic>, <italic>ndhE</italic>, and <italic>ndhH,</italic> and two chloroplast pseudogenes, <italic>petB</italic> and <italic>petD,</italic> in the mitogenome of <italic>P. orientalis</italic> (<xref ref-type="table" rid="T2">Table 2</xref>).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Phylogeny and gene content of the 20 mitogenomes included in this study. <bold>(A)</bold> The phylogenetic tree among major gymnosperm lineages based on 28 shared genes. Numbers next to nodes indicate bootstrap values from 1,000 replicates, and blue bars correspond to the 95% highest posterior density (HPD) of divergence time. Period is shown at the bottom of the tree. Ca., Carboniferous; Pe. Permian; Tr. Triassic; Ju. Jurassic; Cr. Cretaceous; Pa. Paleogene; N. Neogene. <bold>(B)</bold> Gene contents in the 20 mitogenomes. The 28 shared genes are <italic>atp</italic>[1, 4, 6, 8, 9], <italic>ccm</italic>[<italic>B</italic>, <italic>C</italic>, <italic>Fc</italic>, <italic>Fn</italic>], <italic>cob</italic>, <italic>cox</italic>[1&#x2013;3], <italic>matR</italic>, <italic>mttB</italic>, <italic>nad</italic>[1, 2, 3, 4, 4L, 5, 6, 7, 9], <italic>rps</italic>[3, 4, 12], and <italic>sdh</italic>4. Intact genes are indicated by dark blue blocks and missing genes in white. The lost genes that are confirmed as transferred to nucleus are highlighted in orange. Pseudogenes are indicated as &#x3c8;. <bold>(C)</bold> RNA editing sites in the 20 mitogenomes. The two plots in the far right show the number of editing sites for all genes and the 28 shared genes, respectively. <bold>(D)</bold> Nucleotide substitution rates in the 20 mitogenomes. Branch lengths are proportional to rates of synonymous (d<italic>S</italic>) and nonsynonymous (d<italic>N</italic>) substitutions inferred by the maximum-likelihood method implemented in PAML.</p>
</caption>
<graphic xlink:href="fgene-13-867736-g002.tif"/>
</fig>
</sec>
<sec id="s3-2">
<title>3.2 RNA Editing, Mitochondrial Genes-Based Phylogeny, and Variable Substitution Rates in Cupressophytes and Gnetophytes</title>
<p>RNA editing remodels variability in higher plant mitogenomes, and could bias phylogenetic inferences if not accounted for (<xref ref-type="bibr" rid="B55">Szmidt et al., 2001</xref>; <xref ref-type="bibr" rid="B33">Mower, 2005</xref>). We predicted the RNA editing sites in protein coding genes of all 20 species and found that Ginkgo (1,300 sites) and Gnetophytes (225&#x2013;336 sites) had the highest and lowest C-to-U editing sites across all protein-coding regions, respectively, and the other species spanned a range of 520&#x2013;1,220 sites (<xref ref-type="fig" rid="F2">Figure 2C</xref>). This variation in editing frequency reflects a lineage-specific pattern of editing, for example 25% (254) and 44&#x2013;45% (102&#x2013;147) of the editing sites in Ginkgo and Gnetophytes were unique (<xref ref-type="fig" rid="F2">Figure 2C</xref>). In contrast, <italic>C. sempervirens</italic> and <italic>H. glabra</italic> of Cupressophytes each had only 6% (43&#x2013;47) unique sites (<xref ref-type="fig" rid="F2">Figure 2C</xref>).</p>
<p>To assess the accuracy of the predicted editing sites, we identified the edited sites from RNAseq data in <italic>P. orientalis</italic>. A total of 1,068&#xa0;C-to-U edit sites were detected in 32 genes, of which 745 sites were among the 1,007 predicted sites (<xref ref-type="table" rid="T2">Table 2</xref>, <xref ref-type="sec" rid="s11">Supplementary Table S6</xref>). This comparison suggests that the prediction method provides a reasonably reliable estimate of RNA editing (74% in <italic>P. orientalis</italic>), consistent with the results from a previous study (<xref ref-type="bibr" rid="B14">Guo et al., 2016</xref>).</p>
<p>We inferred the phylogeny of the major gymnosperm lineages using 28 conserved protein-coding genes common to all 20 species included in this study. The concatenated sequence alignment consisted 26,844 sites. On this phylogenetic tree, Cupressophytes and Gnetophytes are sister clades with a strong bootstrap support of 92% (<xref ref-type="fig" rid="F2">Figure 2A</xref>). Within Cupressophytes, <italic>P. orientalis</italic> is sister to the group consisting of <italic>C. sempervirens</italic> and <italic>H. glabra</italic> (<xref ref-type="fig" rid="F2">Figure 2A</xref>), and diverged from this group 87 MYA in the Paleogene. The divergence of the Cupressaceae family is dated to 145 MYA (<xref ref-type="fig" rid="F2">Figure 2A</xref>), which is similar to the 159 MYA estimate from nuclear data (<xref ref-type="bibr" rid="B8">De La Torre et al., 2017</xref>).</p>
<p>To evaluate the substitution rates in mitochondrial genes, we estimated synonymous (d<italic>S</italic>) and nonsynonymous (d<italic>N</italic>) substitution rates along the branches of the inferred phylogeny. We found that d<italic>S</italic> and d<italic>N</italic> varied up to 46- and 234-fold among species, respectively. This wide range is mainly caused by Cupressophytes and Gnetophytes with their substantially longer branches and larger variation in d<italic>S</italic> and d<italic>N</italic> among species (<xref ref-type="fig" rid="F2">Figure 2D</xref>; <xref ref-type="table" rid="T3">Table 3</xref>) compared to the other clades, all of which have low substitution rates. The overall d<italic>S</italic> of Cupressophytes and Gnetophytes is more than 5-fold higher than Pinaceae. The same overall pattern is seen with d<italic>N</italic>, although it is about 20&#x2013;70% of the d<italic>S</italic> values, reflecting selective constraints on nonsynonymous mutations (<xref ref-type="fig" rid="F2">Figure 2D</xref>; <xref ref-type="table" rid="T3">Table 3</xref>). Within Cupressophytes, d<italic>S</italic> varied by 46-fold and d<italic>N</italic> varied by 25-fold among lineages, with <italic>P. orientalis</italic> at the low end for both values (d<italic>S &#x3d;</italic> 0.0030, d<italic>N</italic> &#x3d; 0.0015; <xref ref-type="table" rid="T3">Table 3</xref>).</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Relative (d<italic>S</italic>, d<italic>N</italic>) and absolute (R<italic>S</italic>, R<italic>N</italic>) synonymous and nonsynonymous substitution rates. MYA, million years ago.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Species</th>
<th align="center">Time (MYA)</th>
<th align="center">d<italic>S</italic>
</th>
<th align="center">R<italic>S</italic> (site/year)</th>
<th align="center">d<italic>N</italic>
</th>
<th align="center">R<italic>N</italic> (site/year)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">
<italic>Platycladus orientalis</italic>
</td>
<td align="char" char=".">87</td>
<td align="char" char=".">0.002997</td>
<td align="center">3.44483E-11</td>
<td align="char" char=".">0.001498</td>
<td align="center">1.72184E-11</td>
</tr>
<tr>
<td align="left">
<italic>Cupressus sempervirens</italic>
</td>
<td align="char" char=".">31</td>
<td align="char" char=".">0.004554</td>
<td align="center">1.46903E-10</td>
<td align="char" char=".">0.003375</td>
<td align="center">1.08871E-10</td>
</tr>
<tr>
<td align="left">
<italic>Hesperocyparis glabra</italic>
</td>
<td align="char" char=".">31</td>
<td align="char" char=".">0.042915</td>
<td align="center">1.38435E-09</td>
<td align="char" char=".">0.037602</td>
<td align="center">1.21297E-09</td>
</tr>
<tr>
<td align="left">Cupressaceae</td>
<td align="char" char=".">145</td>
<td align="char" char=".">0.050927</td>
<td align="center">3.51221E-10</td>
<td align="char" char=".">0.016829</td>
<td align="center">1.16062E-10</td>
</tr>
<tr>
<td align="left">
<italic>Taxus cuspidata</italic>
</td>
<td align="char" char=".">145</td>
<td align="char" char=".">0.037293</td>
<td align="center">2.57193E-10</td>
<td align="char" char=".">0.014685</td>
<td align="center">1.01276E-10</td>
</tr>
<tr>
<td align="left">
<italic>Podocarpus macrophyllus</italic>
</td>
<td align="char" char=".">127</td>
<td align="char" char=".">0.137564</td>
<td align="center">1.08318E-09</td>
<td align="char" char=".">0.017518</td>
<td align="center">1.37937E-10</td>
</tr>
<tr>
<td align="left">
<italic>Araucaria heterophylla</italic>
</td>
<td align="char" char=".">127</td>
<td align="char" char=".">0.077235</td>
<td align="center">6.08150E-10</td>
<td align="char" char=".">0.019114</td>
<td align="center">1.50504E-10</td>
</tr>
<tr>
<td align="left">
<bold>Cupressophytes</bold>
</td>
<td align="char" char=".">
<bold>252</bold>
</td>
<td align="char" char=".">
<bold>0.064140</bold>
</td>
<td align="center">
<bold>2.54524E-10</bold>
</td>
<td align="char" char=".">
<bold>0.018398</bold>
</td>
<td align="center">
<bold>7.30079E-11</bold>
</td>
</tr>
<tr>
<td align="left">
<italic>Gnetum gnemon</italic>
</td>
<td align="char" char=".">112</td>
<td align="char" char=".">0.057119</td>
<td align="center">5.09991E-10</td>
<td align="char" char=".">0.027154</td>
<td align="center">2.42446E-10</td>
</tr>
<tr>
<td align="left">
<italic>Welwitschia mirabilis</italic>
</td>
<td align="char" char=".">112</td>
<td align="char" char=".">0.126746</td>
<td align="center">1.13166E-09</td>
<td align="char" char=".">0.073152</td>
<td align="center">6.53143E-10</td>
</tr>
<tr>
<td align="left">
<bold>Gnetophytes</bold>
</td>
<td align="char" char=".">
<bold>252</bold>
</td>
<td align="char" char=".">
<bold>0.053585</bold>
</td>
<td align="center">
<bold>2.12639E-10</bold>
</td>
<td align="char" char=".">
<bold>0.019649</bold>
</td>
<td align="center">
<bold>7.79722E-11</bold>
</td>
</tr>
<tr>
<td align="left">
<italic>Picea abies</italic>
</td>
<td align="char" char=".">25</td>
<td align="char" char=".">0.005778</td>
<td align="center">2.31120E-10</td>
<td align="char" char=".">0.005871</td>
<td align="center">2.34840E-10</td>
</tr>
<tr>
<td align="left">
<italic>Picea glauca</italic>
</td>
<td align="char" char=".">25</td>
<td align="char" char=".">0.046808</td>
<td align="center">1.87232E-09</td>
<td align="char" char=".">0.032513</td>
<td align="center">1.30052E-09</td>
</tr>
<tr>
<td align="left">
<italic>Pinus lambertiana</italic>
</td>
<td align="char" char=".">72</td>
<td align="char" char=".">0.005949</td>
<td align="center">8.26250E-11</td>
<td align="char" char=".">0.005264</td>
<td align="center">7.31111E-11</td>
</tr>
<tr>
<td align="left">
<italic>Pinus taeda</italic>
</td>
<td align="char" char=".">72</td>
<td align="char" char=".">0.007723</td>
<td align="center">1.07264E-10</td>
<td align="char" char=".">0.004264</td>
<td align="center">5.92222E-11</td>
</tr>
<tr>
<td align="left">
<italic>Abies sibirica</italic>
</td>
<td align="char" char=".">154</td>
<td align="char" char=".">0.069804</td>
<td align="center">4.53273E-10</td>
<td align="char" char=".">0.054221</td>
<td align="center">3.52084E-10</td>
</tr>
<tr>
<td align="left">
<italic>Larix sibirica</italic>
</td>
<td align="char" char=".">133</td>
<td align="char" char=".">0.031210</td>
<td align="center">2.34662E-10</td>
<td align="char" char=".">0.007401</td>
<td align="center">5.56466E-11</td>
</tr>
<tr>
<td align="left">
<bold>Pinaceae</bold>
</td>
<td align="char" char=".">
<bold>265</bold>
</td>
<td align="char" char=".">
<bold>0.009825</bold>
</td>
<td align="center">
<bold>3.70755E-11</bold>
</td>
<td align="char" char=".">
<bold>0.004160</bold>
</td>
<td align="center">
<bold>1.56981E-11</bold>
</td>
</tr>
<tr>
<td align="left">
<bold>
<italic>Ginkgo biloba</italic>
</bold>
</td>
<td align="char" char=".">
<bold>287</bold>
</td>
<td align="char" char=".">
<bold>0.035716</bold>
</td>
<td align="center">
<bold>1.24446E-10</bold>
</td>
<td align="char" char=".">
<bold>0.007753</bold>
</td>
<td align="center">
<bold>2.70139E-11</bold>
</td>
</tr>
<tr>
<td align="left">
<italic>Ceratozamia hildae</italic>
</td>
<td align="char" char=".">41</td>
<td align="char" char=".">0.003389</td>
<td align="center">8.26585E-11</td>
<td align="char" char=".">0.000312</td>
<td align="center">7.60976E-12</td>
</tr>
<tr>
<td align="left">
<italic>Zamia integrifolia</italic>
</td>
<td align="char" char=".">41</td>
<td align="char" char=".">0.011686</td>
<td align="center">2.85024E-10</td>
<td align="char" char=".">0.009431</td>
<td align="center">2.30024E-10</td>
</tr>
<tr>
<td align="left">
<italic>Cycas taitungensis</italic>
</td>
<td align="char" char=".">194</td>
<td align="char" char=".">0.003073</td>
<td align="center">1.58402E-11</td>
<td align="char" char=".">0.001835</td>
<td align="center">9.45876E-12</td>
</tr>
<tr>
<td align="left">
<bold>Cycads</bold>
</td>
<td align="char" char=".">
<bold>305</bold>
</td>
<td align="char" char=".">
<bold>0.026821</bold>
</td>
<td align="center">
<bold>8.79377E-11</bold>
</td>
<td align="char" char=".">
<bold>0.005682</bold>
</td>
<td align="center">
<bold>1.86295E-11</bold>
</td>
</tr>
<tr>
<td align="left">
<italic>Amborella trichopoda</italic>
</td>
<td align="char" char=".">117</td>
<td align="char" char=".">0.025430</td>
<td align="center">2.17350E-10</td>
<td align="char" char=".">0.010369</td>
<td align="center">8.86239E-11</td>
</tr>
<tr>
<td align="left">
<italic>Liriodendron tulipifera</italic>
</td>
<td align="char" char=".">117</td>
<td align="char" char=".">0.026193</td>
<td align="center">2.23872E-10</td>
<td align="char" char=".">0.009041</td>
<td align="center">7.72735E-11</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Bold values are summary of each major clade including the taxa sampled within the clade.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>Moreover, we calculated the absolute substitution rates R<italic>S</italic> and R<italic>N</italic> per branch by adjusting the d<italic>S</italic> and d<italic>N</italic> by dividing the divergence time of the branch. Again, R<italic>S</italic> and R<italic>N</italic> varied up to 118- and 171-fold among species, respectively, with the highest R<italic>S</italic> and R<italic>N</italic> in Cupressophytes and Gnetophytes, and the lowest in Pinaceae. Within Cupressophytes, R<italic>S</italic> and R<italic>N</italic> varied by 40-fold and 70-fold, with <italic>P. orientalis</italic> having the lowest rates (<xref ref-type="table" rid="T3">Table 3</xref>). This wide range of substitution rates indicates that sequence evolution is heterogeneous within and among plant lineages, especially in Cupressophytes.</p>
</sec>
<sec id="s3-3">
<title>3.3 Mitochondrial Gene Loss and Transfer to Nucleus in Cupressophytes and Gnetophytes</title>
<p>Early studies suggest that the mitogenome of the common ancestor of seed plants probably contained 41 protein-coding genes (<xref ref-type="bibr" rid="B44">Richardson et al., 2013</xref>; <xref ref-type="bibr" rid="B14">Guo et al., 2016</xref>). We found all 41 genes in Cycads, Ginkgo and Pinaceae, but 8&#x2013;12 genes were absent in Cupressophytes and Gnetophytes (white and orange boxes in <xref ref-type="fig" rid="F2">Figure 2B</xref>). All species in Cupressophytes have lost the same set of eight ribosomal protein genes, while Cupressaceae species and <italic>T. cuspidata</italic> lost an additional <italic>sdh3</italic> gene (<xref ref-type="fig" rid="F2">Figure 2B</xref>). In Gnetophytes, both <italic>G. gnemon</italic> and <italic>W. mirabilis</italic> have lost 11 genes, including 10 ribosomal protein genes and the <italic>sdh3</italic> gene; their <italic>rpl</italic>16 appeared as degraded pseudogene (<xref ref-type="fig" rid="F2">Figure 2B</xref>).</p>
<p>The reduction in mitochondrial protein-coding genes in Cupressophytes and Gnetophytes has been suggested to be a result of gene transfer to the nucleus prior to their loss from the mitogenome (<xref ref-type="bibr" rid="B14">Guo et al., 2016</xref>; <xref ref-type="bibr" rid="B15">Guo et al., 2020</xref>). To verify whether the lost genes were transferred to the nucleus, we first searched for them in the transcriptomes of Cupressophytes and Gnetophytes (<xref ref-type="sec" rid="s11">Supplementary Table S2</xref>). We recovered 4&#x2013;7 intact lost mitochondrial genes in transcriptomes of each respective species, but none in <italic>A. heterophylla</italic> (<xref ref-type="fig" rid="F2">Figure 2B</xref>). The recovery of few intact mitochondrial genes in <italic>A. heterophylla</italic> is likely to be a consequence of the limited numbers of ESTs or cDNA sequences in the database, which would hamper detection of these genes in its nuclear genome. We then searched for these recovered genes in their own or related species&#x2019; reference genomes and found all of them with high identity (89&#x2013;100%) and coverage (85&#x2013;100%) scores (<xref ref-type="sec" rid="s11">Supplementary Table S3</xref>). There were a few exceptions, e.g., <italic>rps</italic>11 and <italic>sdh</italic>3 showed lower identity (52&#x2013;75%) but high coverage (92&#x2013;100%) scores, likely due to different substitution rates between genes and species. The BLAST hits of <italic>Podocarpus macrophyllus</italic> genes gave moderate identity scores (48&#x2013;81%) likely because of the lack of closely related reference. We further analyzed the mapping depth of genome resequencing reads to the mitogenes and transcriptome-recovered genes in each Cupressophytes and Gnetophytes species. In <italic>P. orientalis</italic>, the median depth of read coverage of the 32 genes in mitogenome ranged 275&#x2013;1,169&#xd7;, while the nuclear gene <italic>LEAFY</italic> had 15&#xd7; and the chloroplast <italic>matK</italic> 14,395&#xd7; (<xref ref-type="sec" rid="s11">Supplementary Figure S1</xref>). The six recovered mitogenes had median depth of read coverage 11&#x2013;17&#xd7;, similar to the <italic>LEAFY</italic>, supporting their location in nucleus. Using the same approach, we confirmed that 4&#x2013;7 of the lost genes in the seven other species of Cupressophytes and Gnetophytes were transferred to the nucleus (orange boxes in <xref ref-type="fig" rid="F2">Figure 2B</xref>). Our results illustrate the differential abundance of nuclear, mitochondrial and plastid genomes in plant cells, and demonstrate the power of depth of read coverage as a quantitative tool for verification of genome origin of a gene.</p>
</sec>
<sec id="s3-4">
<title>3.4 Sequence Turnover and Structural Rearrangement in Gymnosperm Mitogenomes</title>
<p>Rapid structural evolution is thought to be characteristic of plant mitogenomes (<xref ref-type="bibr" rid="B39">Palmer and Herbon, 1988</xref>; <xref ref-type="bibr" rid="B5">Cole et al., 2018</xref>). To understand the rate of sequence turnover and structural rearrangement in gymnosperms, we examined the degree of synteny and shared DNA among the mitogenomes of the main gymnosperms lineages. We found that syntenic blocks and shared DNA between genomes reduced rapidly with phylogenetic distance (<xref ref-type="fig" rid="F3">Figures 3A&#x2013;D</xref>; <xref ref-type="table" rid="T4">Table 4</xref>). For example, <italic>P. orientalis</italic> and <italic>C. sempervirens</italic> diversified for 87&#xa0;million years (MY) shared &#x223c;60% DNA sequence, but this value dropped sharply to only &#x223c;10% between <italic>P. macrophyllus</italic> and <italic>A. heterophylla</italic> with a divergence time of 126 MY (<xref ref-type="fig" rid="F3">Figures 3A,C</xref>; <xref ref-type="table" rid="T4">Table 4</xref>). We examined the patterns of shared DNA between 16 pairs of gymnosperm species, and found a strong negative correlation (<italic>r</italic> &#x3d; 0.53, <italic>p</italic> &#x3d; 0.03) with time of divergence (<xref ref-type="fig" rid="F3">Figure 3F</xref>). However, as an outlier, exceptionally low DNA turnover was found between <italic>G. biloba</italic> and <italic>C. taitungensis</italic> (<xref ref-type="table" rid="T4">Table 4</xref>), similar to the report by <xref ref-type="bibr" rid="B14">Guo et al. (2016)</xref>. In addition, high proportions of shared DNA (58&#x2013;64%) were retained between <italic>C. taitungensis</italic> and <italic>Ceratozamia hildae</italic>/<italic>Zamia integrifolia</italic> with the divergence time of 194 MY (<xref ref-type="fig" rid="F3">Figure 3E</xref>; <xref ref-type="table" rid="T4">Table 4</xref>). These results illustrate a variable rate of mitogenome turnover in gymnosperms.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Mitogenome alignments between gymnosperm species showing the locally collinear blocks at varying divergence time. <bold>(A)</bold> <italic>Platycladus orientalis vs. Cupressus sempervirens</italic>. <bold>(B)</bold> <italic>Cupressus sempervirens vs. Hesperocyparis glabra</italic>. <bold>(C)</bold> <italic>Podocarpus macrophyllus vs. Araucaria heterophylla</italic>. <bold>(D)</bold> <italic>Gnetum gnemon vs. Welwitschia mirabilis</italic>. <bold>(E)</bold> <italic>Cycas taitungensis vs. Ceratozamia hildae</italic>. The color bars represent corresponding local collinear blocks, heights are proportional to pairwise sequence identity, and blocks below the center line indicate regions that align in the reverse complement (inverse) orientation. MYA, million years ago. <bold>(F)</bold> Correlation between divergence time and the degree of shared sequences. The blue line represents the regression fitting with a linear model. The grey shadow is the 95% confidence interval of the linear regression.</p>
</caption>
<graphic xlink:href="fgene-13-867736-g003.tif"/>
</fig>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Amount of shared mitochondrial DNA in gymnosperms spanning a wide range of divergence times. MYA, million years ago.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" colspan="2" align="left">Species compared</th>
<th rowspan="3" align="center">Divergence time (MYA)</th>
<th colspan="7" align="center">Shared sequence</th>
</tr>
<tr>
<th colspan="3" align="center">Length (Kb)</th>
<th colspan="4" align="center">%Genome</th>
</tr>
<tr>
<th align="left">Species 1</th>
<th align="center">Species 2</th>
<th align="center">S1 to S2</th>
<th align="center">S2 to S1</th>
<th align="center">Mean</th>
<th align="center">S1</th>
<th align="center">S2</th>
<th align="center">Mean</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">
<italic>Platycladus orientalis</italic>
</td>
<td align="left">
<italic>Cupressus sempervirens</italic>
</td>
<td align="char" char=".">87</td>
<td align="center">1,573</td>
<td align="center">1,599</td>
<td align="center">1,586</td>
<td align="char" char=".">60.0</td>
<td align="char" char=".">58.3</td>
<td align="char" char=".">59.2</td>
</tr>
<tr>
<td align="left">
<italic>Platycladus orientalis</italic>
</td>
<td align="left">
<italic>Podocarpus macrophyllus</italic>
</td>
<td align="char" char=".">226</td>
<td align="center">78</td>
<td align="center">99</td>
<td align="center">88</td>
<td align="char" char=".">3.0</td>
<td align="char" char=".">4.9</td>
<td align="char" char=".">4.0</td>
</tr>
<tr>
<td align="left">
<italic>Cupressus sempervirens</italic>
</td>
<td align="left">
<italic>Hesperocyparis glabra</italic>
</td>
<td align="char" char=".">31</td>
<td align="center">1,311</td>
<td align="center">1,344</td>
<td align="center">1,328</td>
<td align="char" char=".">47.8</td>
<td align="char" char=".">68.4</td>
<td align="char" char=".">58.1</td>
</tr>
<tr>
<td align="left">
<italic>Podocarpus macrophyllus</italic>
</td>
<td align="left">
<italic>Araucaria heterophylla</italic>
</td>
<td align="char" char=".">126</td>
<td align="center">156</td>
<td align="center">157</td>
<td align="center">156</td>
<td align="char" char=".">7.7</td>
<td align="char" char=".">11.4</td>
<td align="char" char=".">9.6</td>
</tr>
<tr>
<td align="left">
<italic>Gnetum gnemon</italic>
</td>
<td align="left">
<italic>Welwitschia mirabilis</italic>
</td>
<td align="char" char=".">112</td>
<td align="center">54</td>
<td align="center">53</td>
<td align="center">54</td>
<td align="char" char=".">8.5</td>
<td align="char" char=".">5.4</td>
<td align="char" char=".">7.0</td>
</tr>
<tr>
<td align="left">
<italic>Platycladus orientalis</italic>
</td>
<td align="left">
<italic>Welwitschia mirabilis</italic>
</td>
<td align="char" char=".">252</td>
<td align="center">31</td>
<td align="center">46</td>
<td align="center">38</td>
<td align="char" char=".">1.2</td>
<td align="char" char=".">4.7</td>
<td align="char" char=".">3.0</td>
</tr>
<tr>
<td align="left">
<italic>Picea abies</italic>
</td>
<td align="left">
<italic>Welwitschia mirabilis</italic>
</td>
<td align="char" char=".">265</td>
<td align="center">39</td>
<td align="center">54</td>
<td align="center">46</td>
<td align="char" char=".">0.8</td>
<td align="char" char=".">5.6</td>
<td align="char" char=".">3.2</td>
</tr>
<tr>
<td align="left">
<italic>Picea abies</italic>
</td>
<td align="left">
<italic>Picea glauca</italic>
</td>
<td align="char" char=".">25</td>
<td align="center">3,808</td>
<td align="center">3,658</td>
<td align="center">3,733</td>
<td align="char" char=".">77.7</td>
<td align="char" char=".">61.0</td>
<td align="char" char=".">69.4</td>
</tr>
<tr>
<td align="left">
<italic>Pinus lambertiana</italic>
</td>
<td align="left">
<italic>Pinus taeda</italic>
</td>
<td align="char" char=".">72</td>
<td align="center">677</td>
<td align="center">855</td>
<td align="center">766</td>
<td align="char" char=".">16.9</td>
<td align="char" char=".">71.8</td>
<td align="char" char=".">44.4</td>
</tr>
<tr>
<td align="left">
<italic>Abies sibirica</italic>
</td>
<td align="left">
<italic>Pinus taeda</italic>
</td>
<td align="char" char=".">154</td>
<td align="center">176</td>
<td align="center">167</td>
<td align="center">172</td>
<td align="char" char=".">11.9</td>
<td align="char" char=".">14.1</td>
<td align="char" char=".">13.0</td>
</tr>
<tr>
<td align="left">
<italic>Ginkgo biloba</italic>
</td>
<td align="left">
<italic>Welwitschia mirabilis</italic>
</td>
<td align="char" char=".">287</td>
<td align="center">37</td>
<td align="center">36</td>
<td align="center">36</td>
<td align="char" char=".">10.7</td>
<td align="char" char=".">3.7</td>
<td align="char" char=".">7.2</td>
</tr>
<tr>
<td align="left">
<italic>Ginkgo biloba</italic>
</td>
<td align="left">
<italic>Cycas taitungensis</italic>
</td>
<td align="char" char=".">305</td>
<td align="center">233</td>
<td align="center">226</td>
<td align="center">230</td>
<td align="char" char=".">67.5</td>
<td align="char" char=".">54.7</td>
<td align="char" char=".">61.1</td>
</tr>
<tr>
<td align="left">
<italic>Ceratozamia hildae</italic>
</td>
<td align="left">
<italic>Zamia integrifolia</italic>
</td>
<td align="char" char=".">41</td>
<td align="center">344</td>
<td align="center">319</td>
<td align="center">332</td>
<td align="char" char=".">83.7</td>
<td align="char" char=".">68.2</td>
<td align="char" char=".">76.0</td>
</tr>
<tr>
<td align="left">
<italic>Cycas taitungensis</italic>
</td>
<td align="left">
<italic>Ceratozamia hildae</italic>
</td>
<td align="char" char=".">194</td>
<td align="center">247</td>
<td align="center">278</td>
<td align="center">262</td>
<td align="char" char=".">59.7</td>
<td align="char" char=".">67.7</td>
<td align="char" char=".">63.7</td>
</tr>
<tr>
<td align="left">
<italic>Cycas taitungensis</italic>
</td>
<td align="left">
<italic>Zamia integrifolia</italic>
</td>
<td align="char" char=".">194</td>
<td align="center">244</td>
<td align="center">265</td>
<td align="center">254</td>
<td align="char" char=".">58.8</td>
<td align="char" char=".">56.6</td>
<td align="char" char=".">57.7</td>
</tr>
<tr>
<td align="left">
<italic>Cycas taitungensis</italic>
</td>
<td align="left">
<italic>Welwitschia mirabilis</italic>
</td>
<td align="char" char=".">305</td>
<td align="center">36</td>
<td align="center">36</td>
<td align="center">36</td>
<td align="char" char=".">8.9</td>
<td align="char" char=".">3.8</td>
<td align="char" char=".">6.4</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-5">
<title>3.5 Repetitive Sequences in Gymnosperm Mitogenomes</title>
<p>Repetitive sequences, particularly TEs, are important components of plant nuclear genomes and contribute to genome size variation and functional regulation (<xref ref-type="bibr" rid="B32">Mehrotra and Goyal, 2014</xref>). In contrast, TEs and other repetitive elements in plant mitogenomes are poorly characterized. In this study, we annotated TEs, tandem repeats, and dispersed repeats in the 20 mitogenomes, and found that they have a strong correlation with the genome size and are highly variable among species (<xref ref-type="fig" rid="F4">Figure 4</xref>; <xref ref-type="table" rid="T5">Table 5</xref>). The highest proportion of TE is in <italic>A. sibirica</italic> (19.26%), followed by <italic>Z. integrifolia</italic> (15.57%), and the lowest in <italic>W. mirabilis</italic> (1.06%). TE contents vary widely even in the same clade, e.g. from 1.58% (<italic>P. macrophyllus</italic>) to 6.80% (<italic>H. glabra</italic>) in Cupressophytes, from 5.29% (<italic>P. lambertiana</italic>) to 19.26% (<italic>A. sibirica</italic>) in Pinaceae, and from 2.52% (<italic>C. taitungensis</italic>) to 15.57% (<italic>Z. integrifolia</italic>) in Cycads. Among TEs, LTRs (long terminal repeats) are the most common group followed by LINE (long interspersed nuclear elements) in most species (<xref ref-type="fig" rid="F4">Figure 4A</xref>). For the three Cupressaceae species and the two <italic>Pinus</italic> species, the most abundant element is the &#x201c;Unknown&#x201d; category (<xref ref-type="fig" rid="F4">Figure 4A</xref>). The &#x201c;Unknown&#x201d; category of TEs could be due to accumulation of various mutations over long evolutionary time that have degraded the TEs into sequences that cannot be properly classified.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Composition of repetitive sequences in gymnosperm mitogenomes. <bold>(A)</bold> The proportion of TE classes identified in each genome. LTR, long terminal repeat; LINE, long interspersed nuclear element; SINE, short interspersed element; DNA, DNA transposable element; Unknown, unclassified transposable element. <bold>(B)</bold> Correlation between mitogenome size and tandem repeat size, <bold>(C)</bold> TE size, <bold>(D)</bold> dispersed repeat size, and <bold>(E)</bold> repetitive sequence size. The blue line represents the regression fitting with a linear model. The grey shadow is the 95% confidence interval of the linear regression.</p>
</caption>
<graphic xlink:href="fgene-13-867736-g004.tif"/>
</fig>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Repetitive sequences in each mitogenome. Dispersed repeats are divided into small-size (&#x003c;100 bp), medium-size (100&#x2013;1,000 bp), and large-size (&#x2265;1,000 bp) classes. Note, overlapping repetitive sequences are counted only once when calculating their total size.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left">Species</th>
<th colspan="4" align="center">Repetitive sequences (Kb)</th>
<th colspan="4" align="center">Number of dispersed repeats</th>
</tr>
<tr>
<th align="center">All</th>
<th align="center">Tandem repeats</th>
<th align="center">Transposable elements</th>
<th align="center">Dispersed repeats</th>
<th align="center">All</th>
<th align="center">Small-size</th>
<th align="center">Medium-size</th>
<th align="center">Large-size</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">
<italic>Platycladus orientalis</italic>
</td>
<td align="char" char="(">608 (23.18%)</td>
<td align="char" char="(">123 (4.70%)</td>
<td align="char" char="(">157 (6.00%)</td>
<td align="char" char="(">541 (20.60%)</td>
<td align="center">7,634</td>
<td align="center">6,332</td>
<td align="center">1,269</td>
<td align="char" char=".">33</td>
</tr>
<tr>
<td align="left">
<italic>Cupressus sempervirens</italic>
</td>
<td align="char" char="(">649 (23.66%)</td>
<td align="char" char="(">68 (2.48%)</td>
<td align="char" char="(">62 (2.26%)</td>
<td align="char" char="(">594 (21.65%)</td>
<td align="center">21,162</td>
<td align="center">20,061</td>
<td align="center">1,101</td>
<td align="char" char=".">0</td>
</tr>
<tr>
<td align="left">
<italic>Hesperocyparis glabra</italic>
</td>
<td align="char" char="(">500 (25.42%)</td>
<td align="char" char="(">76 (3.85%)</td>
<td align="char" char="(">134 (6.80%)</td>
<td align="char" char="(">437 (22.24%)</td>
<td align="center">28,579</td>
<td align="center">26,598</td>
<td align="center">1,823</td>
<td align="char" char=".">158</td>
</tr>
<tr>
<td align="left">
<italic>Taxus cuspidata</italic>
</td>
<td align="char" char="(">96 (20.45%)</td>
<td align="char" char="(">33 (6.99%)</td>
<td align="char" char="(">12 (2.49%)</td>
<td align="char" char="(">72 (15.30%)</td>
<td align="center">1,157</td>
<td align="center">908</td>
<td align="center">247</td>
<td align="char" char=".">2</td>
</tr>
<tr>
<td align="left">
<italic>Podocarpus macrophyllus</italic>
</td>
<td align="char" char="(">202 (9.99%)</td>
<td align="char" char="(">19 (0.94%)</td>
<td align="char" char="(">32 (1.58%)</td>
<td align="char" char="(">167 (8.26%)</td>
<td align="center">1,927</td>
<td align="center">1,520</td>
<td align="center">397</td>
<td align="char" char=".">10</td>
</tr>
<tr>
<td align="left">
<italic>Araucaria heterophylla</italic>
</td>
<td align="char" char="(">230 (16.62%)</td>
<td align="char" char="(">45 (3.24%)</td>
<td align="char" char="(">42 (3.04%)</td>
<td align="char" char="(">178 (12.84%)</td>
<td align="center">2,546</td>
<td align="center">1,817</td>
<td align="center">723</td>
<td align="char" char=".">6</td>
</tr>
<tr>
<td align="left">
<italic>Gnetum gnemon</italic>
</td>
<td align="char" char="(">203 (31.75%)</td>
<td align="char" char="(">29 (4.60%)</td>
<td align="char" char="(">22 (3.49%)</td>
<td align="char" char="(">171 (26.75%)</td>
<td align="center">22,333</td>
<td align="center">19,944</td>
<td align="center">2,355</td>
<td align="char" char=".">34</td>
</tr>
<tr>
<td align="left">
<italic>Welwitschia mirabilis</italic>
</td>
<td align="char" char="(">86 (8.83%)</td>
<td align="char" char="(">24 (2.49%)</td>
<td align="char" char="(">10 (1.06%)</td>
<td align="char" char="(">61 (6.22%)</td>
<td align="center">822</td>
<td align="center">781</td>
<td align="center">41</td>
<td align="char" char=".">0</td>
</tr>
<tr>
<td align="left">
<italic>Picea abies</italic>
</td>
<td align="char" char="(">1,320 (26.95%)</td>
<td align="char" char="(">101 (2.07%)</td>
<td align="char" char="(">463 (9.46%)</td>
<td align="char" char="(">1,082 (22.09%)</td>
<td align="center">14,718</td>
<td align="center">11,856</td>
<td align="center">2,825</td>
<td align="char" char=".">37</td>
</tr>
<tr>
<td align="left">
<italic>Picea glauca</italic>
</td>
<td align="char" char="(">1,670 (27.86%)</td>
<td align="char" char="(">126 (2.10%)</td>
<td align="char" char="(">440 (7.33%)</td>
<td align="char" char="(">1,411 (23.54%)</td>
<td align="center">19,734</td>
<td align="center">15,853</td>
<td align="center">3,795</td>
<td align="char" char=".">86</td>
</tr>
<tr>
<td align="left">
<italic>Pinus lambertiana</italic>
</td>
<td align="char" char="(">1,079 (26.82%)</td>
<td align="char" char="(">80 (1.99%)</td>
<td align="char" char="(">213 (5.29%)</td>
<td align="char" char="(">950 (23.63%)</td>
<td align="center">134,961</td>
<td align="center">126,792</td>
<td align="center">8,157</td>
<td align="char" char=".">12</td>
</tr>
<tr>
<td align="left">
<italic>Pinus taeda</italic>
</td>
<td align="char" char="(">281 (23.58%)</td>
<td align="char" char="(">60 (5.04%)</td>
<td align="char" char="(">94 (7.93%)</td>
<td align="char" char="(">242 (20.30%)</td>
<td align="center">51,637</td>
<td align="center">41,842</td>
<td align="center">9,787</td>
<td align="char" char=".">8</td>
</tr>
<tr>
<td align="left">
<italic>Larix sibirica</italic>
</td>
<td align="char" char="(">3,899 (33.44%)</td>
<td align="char" char="(">132 (1.13%)</td>
<td align="char" char="(">1,052 (9.02%)</td>
<td align="char" char="(">3,293 (28.23%)</td>
<td align="center">150,913</td>
<td align="center">100,388</td>
<td align="center">50,404</td>
<td align="char" char=".">121</td>
</tr>
<tr>
<td align="left">
<italic>Abies sibirica</italic>
</td>
<td align="char" char="(">568 (38.24%)</td>
<td align="char" char="(">24 (1.60%)</td>
<td align="char" char="(">286 (19.26%)</td>
<td align="char" char="(">469 (31.54%)</td>
<td align="center">2,712</td>
<td align="center">1,299</td>
<td align="center">1,195</td>
<td align="char" char=".">218</td>
</tr>
<tr>
<td align="left">
<italic>Ginkgo biloba</italic>
</td>
<td align="char" char="(">49 (14.13%)</td>
<td align="char" char="(">4 (1.04%)</td>
<td align="char" char="(">11 (3.21%)</td>
<td align="char" char="(">38 (10.92%)</td>
<td align="center">2,712</td>
<td align="center">2,685</td>
<td align="center">24</td>
<td align="char" char=".">3</td>
</tr>
<tr>
<td align="left">
<italic>Ceratozamia hildae</italic>
</td>
<td align="char" char="(">106 (25.84%)</td>
<td align="char" char="(">9 (2.24%)</td>
<td align="char" char="(">56 (13.56%)</td>
<td align="char" char="(">89 (21.72%)</td>
<td align="center">3,054</td>
<td align="center">2,404</td>
<td align="center">643</td>
<td align="char" char=".">7</td>
</tr>
<tr>
<td align="left">
<italic>Zamia integrifolia</italic>
</td>
<td align="char" char="(">168 (35.76%)</td>
<td align="char" char="(">9 (1.95%)</td>
<td align="char" char="(">73 (15.57%)</td>
<td align="char" char="(">150 (31.92%)</td>
<td align="center">3,390</td>
<td align="center">2,478</td>
<td align="center">831</td>
<td align="char" char=".">81</td>
</tr>
<tr>
<td align="left">
<italic>Cycas taitungensis</italic>
</td>
<td align="char" char="(">122 (29.30%)</td>
<td align="char" char="(">22 (5.40%)</td>
<td align="char" char="(">10 (2.52%)</td>
<td align="char" char="(">111 (26.75%)</td>
<td align="center">42,039</td>
<td align="center">31,747</td>
<td align="center">10,285</td>
<td align="char" char=".">7</td>
</tr>
<tr>
<td align="left">
<italic>Amborella trichopoda</italic>
</td>
<td align="char" char="(">1,068 (27.62%)</td>
<td align="char" char="(">71 (1.83%)</td>
<td align="char" char="(">241 (6.24%)</td>
<td align="char" char="(">907 (23.47%)</td>
<td align="center">142,369</td>
<td align="center">113,064</td>
<td align="center">29,249</td>
<td align="char" char=".">56</td>
</tr>
<tr>
<td align="left">
<italic>Liriodendron tulipifera</italic>
</td>
<td align="char" char="(">116 (20.94%)</td>
<td align="char" char="(">2 (0.36%)</td>
<td align="char" char="(">39 (7.02%)</td>
<td align="char" char="(">83 (15.02%)</td>
<td align="center">669</td>
<td align="center">564</td>
<td align="center">99</td>
<td align="char" char=".">6</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>In addition to TEs, dispersed repeats, including inverted and direct orientation duplicated sequences, are prevalent and made up to 20&#x2013;30% of the mitogenomes, with a few exceptions (<xref ref-type="table" rid="T5">Table 5</xref>). The highest proportion is found in Cycads (22&#x2013;32%) and <italic>A. sibirica</italic> in Pinaceae (32%). The two species in Gnetophytes are highly variable in this regard with 6% in <italic>W. mirabilis</italic> but 27% in <italic>G. gnemon</italic>; this value was stable (21&#x2013;22%) among the three taxa in Cupressaceae. Tandem repeats are a smaller component compared to dispersed repeats and TEs, and were observed at the level of 1&#x2013;5% in most of the mitogenomes (<xref ref-type="table" rid="T5">Table 5</xref>). The overall repetitive sequences composed 20&#x2013;38% of the analyzed mitogenomes with a few exceptions of 9&#x2013;17%, and show a strong correlation with genome size (<italic>r</italic> &#x3d; 0.99, <italic>p</italic> &#x3c; 0.0001; <xref ref-type="fig" rid="F4">Figure 4E</xref>; <xref ref-type="table" rid="T5">Table 5</xref>).</p>
</sec>
<sec id="s3-6">
<title>3.6 Accumulation and Elimination of Dispersed Repeats in Mitogenomes</title>
<p>To understand the dynamics of dispersed repeats in mitogenomes, we divided the repeats into small-, medium-, and large-size classes with lengths of &#x3c;100 bp, 100&#x2013;1,000&#xa0;bp, and &#x2265;1,000&#xa0;bp, respectively. We found that small-size repeats are the most abundant class in the 20 mitogenomes, followed by the medium-size repeats, while large-size repeats are rare (<xref ref-type="table" rid="T5">Table 5</xref>). The median lengths for the three classes are 52&#xa0;bp, 136&#xa0;bp, and 1,517&#xa0;bp, respectively. The number of small-size repeats are 2&#x2013;20 fold more common than medium-size repeats; <italic>G. biloba</italic> was extreme having 112-fold more small-size than medium-size repeats (<xref ref-type="table" rid="T5">Table 5</xref>). In <italic>A. sibirica</italic>, the two classes are balanced. Large-size dispersed repeats are limited, with 50% of the species containing fewer than 15 large repeats (<xref ref-type="table" rid="T5">Table 5</xref>). On the other hand, three species <italic>A. sibirica, H. glabra</italic> and <italic>L. sibirica</italic>, had more than 100 large repeats (<xref ref-type="table" rid="T5">Table 5</xref>). Thus, the density plots for small-size and medium-size repeats are similar among species, while it varied widely for the large-size repeats (<xref ref-type="fig" rid="F5">Figure 5A</xref>). The GC contents are relatively conserved for the three classes of dispersed repeats (<xref ref-type="fig" rid="F5">Figure 5B</xref>).</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>The distribution of repeat size, GC content, and Kimuta 2-parameter (K2P) distance of dispersed repeats in each genome. <bold>(A)</bold> The density plot showing the length distribution of three classes of dispersed repeats. <bold>(B)</bold> The distribution of GC content in each size class. <bold>(C)</bold> The distribution of K2P distances among dispersed repeats. Repeats are grouped into small-size (&#x3c;100&#xa0;bp), medium-size (100&#x2013;1,000 bp) and large-size (&#x2265;1,000&#xa0;bp) classes. The K2P distance of 0 and 0.2 are shown with vertical red dash line<bold>s.</bold> Note, <italic>Taxus cuspidata</italic> contains two large-size dispersed repeats with K2P values of 0 and 0.0046, respectively, which failed to show in the density plot <bold>(C)</bold>
</p>
</caption>
<graphic xlink:href="fgene-13-867736-g005.tif"/>
</fig>
<p>To understand the tempo of evolution in dispersed repeats, we analyzed the distribution of K2P distances among the repeats in the 20 mitogenomes. Small values of K2P represent recent duplications while large values represent more ancient duplication events. We divided the K2P values into three distance classes: &#x223c;0 as recent duplications, &#x3e;0 and &#x3c;0.2 as intermediate events, and &#x3e;0.2 as ancient insertions. A K2P distribution with a dominant narrow peak indicates rapid accumulation of repeats in a short period, otherwise a flattened peak indicates a slow generation of repeats over a prolonged period. As shown in <xref ref-type="fig" rid="F5">Figure 5C</xref>, the K2P distributions of the small-size class is similar among all species with a dominant recent peak and lack of ancient insertions, suggesting they have been accumulated recently over a short time span. In contrast, the K2P distribution of the medium-size and large-size repeats are visibly different among species, often with two or three peaks spanning recent to ancient classes, suggesting multiple and distant expansion events.</p>
<p>Ancient dispersed repeats are easy to identify based on K2P distances, but they are not prevalent in the 20 mitogenomes. This may suggest that the persistance of ancient large-size repeats is governed by the rates of accumulation and elimination. Large repeats can be eliminated or broken down by repeat-mediated recombination, resulting in an increase in small- or medium-size repeats that appear to be more recent expansions (<xref ref-type="bibr" rid="B30">Mar&#xe9;chal and Brisson, 2010</xref>; <xref ref-type="bibr" rid="B54">Sullivan et al., 2020</xref>).</p>
</sec>
</sec>
<sec id="s4">
<title>4 Discussion</title>
<p>Assembly of gymnosperm mitogenomes from genomic sequence data is challenging because of complex mechanisms contributing to structural and sequence variation, and lack of well-developed databases and tools for accurate genome mapping. Up to now, only &#x223c;20 gymnosperm mitogenomes have been released. This study contributes a complete mitogenome sequence for Cupressaceae and expands the coverage in gymnosperms. With this new genome, we performed in-depth comparative analyses among major gymnosperm lineages to understand the tempo and mode of mitogenome evolution.</p>
<sec id="s4-1">
<title>4.1 Heterogeneity in Repetitive Elements in Mitogenomes</title>
<p>Among the available gymnosperm mitogenomes, genome sizes vary markedly by 30-fold (<xref ref-type="table" rid="T1">Table 1</xref>). This large variation is hypothesized to be due to lineage- or species-specific accumulation of repetitive sequences, horizontal transfers and intergenomic transfers (<xref ref-type="bibr" rid="B12">Goremykin et al., 2012</xref>; <xref ref-type="bibr" rid="B43">Rice et al., 2013</xref>; <xref ref-type="bibr" rid="B16">Guo et al., 2017</xref>). It has been reported that 29&#x2013;100% of sequences in gymnosperm mitogenomes are similar to the nuclear genome sequences (<xref ref-type="bibr" rid="B54">Sullivan et al., 2020</xref>). In <italic>P. orientalis</italic> we found 76% undefined sequences (<xref ref-type="table" rid="T2">Table 2</xref>), which could in part have been derived from the nucleus by intracellular transfer.</p>
<p>Another source of mitogenome size variation is repetitive sequences. Estimations of repetitive contents can be affected by filter and search criteria, e.g. setting the length to 50&#xa0;bp or 100&#xa0;bp could underestimate the full size range of repeats. In this study, we searched for dispersed repeats in all size classes. We found that dispersed repeats occupied 6&#x2013;32% and TEs 1&#x2013;19% in the sampled mitogenomes. The wide range of dispersed repeats content quantified in this study mirror the results of 1&#x2013;49% found in 82 angiosperms (<xref ref-type="bibr" rid="B9">Dong et al., 2018</xref>). All categories of repetitive sequences are strongly correlated with genome size, giving an overall relationship of <italic>r</italic> &#x3d; 0.99. Our results illustrate that repetitive sequences, especially TEs and dispersed repeats, are major components of mitogenome expansion.</p>
<p>Although a major component of mitogenomes, the size distributions of repetitive sequences and the dynamics of their accumulation have rarely been investigated in gymnosperms. We analyzed the frequency and sequence diversity of different size classes of repeats, and found small-size repeats are most common while large-size repeats are rare and vary widely among species. K2P distances among repeats indicate that most of the repeats have accumulated by recent expansions. Large-size repeats usually tend to recombine more frequently than small repeats (<xref ref-type="bibr" rid="B47">Skippington et al., 2015</xref>; <xref ref-type="bibr" rid="B14">Guo et al., 2016</xref>), which may eliminate large repeats over time. However, in <italic>P. abies</italic>, most recombinogenic repeats are small- to medium-size, which deviates from the general expectation that, in the absence of other factors, recombination should scale positively with repeat length (<xref ref-type="bibr" rid="B54">Sullivan et al., 2020</xref>). We are of the opinion that genome- or region-specific recombination rates could lead to unique sequence turnover rates resulting in the heterogeneous distribution of large repeats in mitogenomes.</p>
</sec>
<sec id="s4-2">
<title>4.2 Extensive Rearrangement and Sequence Turnover in Mitogenomes</title>
<p>The plant mitogenome is characterized by rapid structural rearrangement and sequence turnover, driven by a high recombination activity, making mtDNA highly variable even between closely related species (<xref ref-type="bibr" rid="B14">Guo et al., 2016</xref>; <xref ref-type="bibr" rid="B5">Cole et al., 2018</xref>; <xref ref-type="bibr" rid="B54">Sullivan et al., 2020</xref>). In line with this view, extensive rearrangement is found between two spruce species, <italic>P. abies</italic> and <italic>P. glauca</italic> (<xref ref-type="bibr" rid="B54">Sullivan et al., 2020</xref>). On the other hand, the mitogenomes of <italic>G. biloba</italic> and <italic>C. taitungensis</italic> have retained substantial amounts of shared DNA despite their divergence time &#x3e;300 MY (<xref ref-type="table" rid="T4">Table 4</xref>; <xref ref-type="bibr" rid="B14">Guo et al., 2016</xref>). Even with these extreme cases, we found that the synteny blocks and shared DNA between mitogenomes generally decayed with divergence time, with a negative correlation <italic>r</italic> &#x3d; 0.53 (<italic>p</italic> &#x3d; 0.03) among the gymnosperms (<xref ref-type="fig" rid="F3">Figure 3F</xref>). Although not exhaustive, our analysis provides a quantitative estimation of the rate of sequence turnover in gymnosperm mitogenomes. Previous studies show that rearrangement in mitogenomes occurs largely through repeat-mediated recombination (<xref ref-type="bibr" rid="B5">Cole et al., 2018</xref>; <xref ref-type="bibr" rid="B62">Xia et al., 2020</xref>). However, the relationship between inter- and intra-molecule recombination and rearrangement rates among species is unclear (<xref ref-type="bibr" rid="B5">Cole et al., 2018</xref>). Recombination dynamics in plant mitogenomes are poorly understood to date and deserve further scrutiny as it drives sequence and structural evolution of plant mitogenomes, and affects genome integrity and biological function.</p>
</sec>
<sec id="s4-3">
<title>4.3 mtDNA Evidence Support Cupressophytes and Gnetophytes as Sister Groups</title>
<p>The phylogenetic placement of Gnetophytes differs among studies. Five conflicting hypotheses were supported by different marker systems and include: the Gnetophytes-other seed plant hypothesis, the Gnetophytes-other gymnosperm hypothesis, the Gnetifer (Gnetophytes &#x2b; Conifers) hypothesis, the Gnepine (Gnetophytes &#x2b; Pinaceae) hypothesis, and the GneCup (Gnetophytes &#x2b; Cupressophytes) hypothesis (<xref ref-type="bibr" rid="B42">Ran et al., 2018</xref>). Yet another suggestion is that Gnetophytes is sister to or within the conifers (<xref ref-type="bibr" rid="B56">Wan et al., 2018</xref>). The Gnepine hypothesis is favored by most studies (<xref ref-type="bibr" rid="B42">Ran et al., 2018</xref>), including a recent phylogeny based on mitochondrial protein-coding genes (<xref ref-type="bibr" rid="B22">Kan et al., 2021</xref>). On the other hand, plastid DNA strongly supports the GneCup hypothesis (<xref ref-type="bibr" rid="B45">Ruhfel et al., 2014</xref>; <xref ref-type="bibr" rid="B11">Gitzendanner et al., 2018</xref>; <xref ref-type="bibr" rid="B25">Leebens-Mack et al., 2019</xref>). This incongruence between datasets might be due to differences in the substitution rates of mitochondrial, plastid and nuclear genes, as well as the amount of informative sites included in each study.</p>
<p>In this study, we inferred the relationships among major gymnosperm lineages using 28 conserved protein-coding genes. The recovered phylogeny supports the GneCup hypothesis with a strong bootstrap support. We are more in favor of GneCup hypothesis because of the shared gene transfer pattern in these two clades. Over evolutionary time, some segments of mtDNA have diverged so much that groups of genes have been lost. The common ancestor of seed plants is inferred to contain 41 protein-coding genes (<xref ref-type="bibr" rid="B14">Guo et al., 2016</xref>; <xref ref-type="bibr" rid="B35">Mower, 2020</xref>), and Cycads, Ginkgo, and Pinaceae maintained this same set. The mitogenomes of Cupressophytes and Gnetophytes stand out from other gymnosperms in that both have lost 8&#x2013;11 ribosomal protein-coding genes and the <italic>sdh3</italic> gene, with the exception of <italic>Ephedra przewalskii</italic> (Gnetophytes) which has lost 19 genes (<xref ref-type="bibr" rid="B15">Guo et al., 2020</xref>; <xref ref-type="bibr" rid="B22">Kan et al., 2021</xref>). To confirm whether these lost genes have been transferred to nucleus, we first annotated them in transcriptomes, then identified their homologs in nuclear genomes, and further examined their depth of mapped reads using genome resequencing data. All three lines of evidence support the transfer of 4&#x2013;7 mitogenes to nucleus. Our findings are in good agreement with the recent studies by <xref ref-type="bibr" rid="B21">Kan et al. (2020)</xref> and <xref ref-type="bibr" rid="B22">Kan et al. (2021)</xref>, in which they report finding 6&#x2013;8 intact or partial homologs of lost genes in the nuclear genomes. In sharp contrast, the three other lineages of gymnosperms, including Pinaceae, Ginkgo, and Cycads, share the same set of genes as the common ancestor more than 300 MYA (<xref ref-type="bibr" rid="B15">Guo et al., 2020</xref>). The unrecovered missing mitogenes could either be truly lost or not present in the transcriptomes we analyzed due to tissue- and/or time-specific expression, or incomplete annotation from transcriptomes, which identified the genes as partial homologs instead of intact genes.</p>
<p>Other striking characteristics of Cupressophyte and Gnetophyte mtDNA are their accelerated and hugely variable substitution rates across the 28 conserved protein-coding genes relative to other gymnosperms. The synonymous substitution rate d<italic>S</italic> in Cupressophytes and Gnetophytes averaged 0.0641 and 0.0536, respectively. After scaling up by divergence time, the absolute synonymous substitution rates R<italic>S</italic> were similar in Cupressophytes and Gnetophytes with 2.5 &#xd7; 10<sup>&#x2212;10</sup> and 2.1 &#xd7; 10<sup>&#x2212;10</sup> site/year, respectively, and are &#x223c;2&#x2013;7 fold higher than Pinaceae, Ginkgo, and Cycads. Previous work similarly inferred exceptionally low substitution rates in Pinaceae (<italic>Pinus</italic> and <italic>Picea</italic>) and higher substitution rates in Gnetophytes species (<xref ref-type="bibr" rid="B14">Guo et al., 2016</xref>; <xref ref-type="bibr" rid="B54">Sullivan et al., 2020</xref>; <xref ref-type="bibr" rid="B22">Kan et al., 2021</xref>). However, the extraordinary variation in R<italic>S</italic> in Cupressophytes and Gnetophytes is revealed only by denser sampling of taxa from each clade. Within Cupressophytes, R<italic>S</italic> varied 46-fold among taxa. Our results add to the recognition that while most plant mitogenomes show very low synonymous substitution rates, this rate of divergence is also exceptionally variable for reasons still unclear (<xref ref-type="bibr" rid="B34">Mower et al., 2007</xref>). Another unexpected finding is that within Gnetophytes, <italic>G. gnemon</italic> and <italic>W. mirabilis</italic> showed distinct species-specific RNA editing patters as 87&#x2013;91% of their editing sites differ from each other. Such a striking diversification in RNA editing is not observed within other clades. Future studies with broader taxa sampling are required to understand the mechanisms driving these patterns, including gene loss and transfer, TEs, recombination and selection.</p>
</sec>
</sec>
<sec id="s5">
<title>5 Conclusion</title>
<p>This study contributes a complete mitogenome assembly of <italic>P. orientalis</italic> to the still very limited accessions in gymnosperms. Our comparative analyses with 19 other mitogenomes of seed plants characterized the composition and distribution of repetitive elements, the tempo of sequence turnover and structural rearrangement, and the frequency of RNA editing in protein-coding genes. Our study revealed shared patterns of cyto-unclear gene transfer and accelerated substitution rates in Cupressophytes and Gnetophytes, and lend support to their sister group placement within the gymnosperms. Our findings highlight and reinforce the dynamic and enigmatic evolution of mitogenomes in gymnosperms.</p>
</sec>
</body>
<back>
<sec id="s6">
<title>Data Availability Statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/genbank/,%20OL703044-OL703045">https://www.ncbi.nlm.nih.gov/genbank/, OL703044-OL703045</ext-link>.</p>
</sec>
<sec id="s7">
<title>Author Contributions</title>
<p>WZ, HL and X-RW designed the study; HL, WZ, R-GZ and J-FM generated and analyzed data; HL, WZ, and X-RW wrote the manuscript with contributions from all authors.</p>
</sec>
<sec id="s8">
<title>Funding</title>
<p>This study was supported by grants from the National Natural Science Foundation of China (No. 32171816), and the Swedish Research Council (VR 2017-04686).</p>
</sec>
<sec sec-type="COI-statement" id="s9">
<title>Conflict of Interest</title>
<p>Author R-GZ was employed by the company Ori (Shandong) Gene Science and Technology Co., Ltd.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s10">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ack>
<p>We thank Dr. Jeffrey Mower for sharing data with us, and Prof. Barbara Giles for valuable comments and linguistic editing. We also thank one of the reviewers for constructive suggestions that improved the clarity of the manuscript. Genomic data processing and analyses were performed using resources provided by the Swedish National Infrastructure for Computing (SNIC), through the High Performance Computing Centre North (HPC2N), Ume&#xe5; University.</p>
</ack>
<sec id="s11">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2022.867736/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2022.867736/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet1.docx" id="SM1" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Benson</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>Tandem Repeats Finder: A Program to Analyze DNA Sequences</article-title>. <source>Nucleic Acids Res.</source> <volume>27</volume> (<issue>2</issue>), <fpage>573</fpage>&#x2013;<lpage>580</lpage>. <pub-id pub-id-type="doi">10.1093/nar/27.2.573</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chaw</surname>
<given-names>S.-M.</given-names>
</name>
<name>
<surname>Chun-Chieh Shih</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Y.-W.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>S.-M.</given-names>
</name>
<name>
<surname>Chou</surname>
<given-names>T.-Y.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>The Mitochondrial Genome of the Gymnosperm <italic>Cycas Taitungensis</italic> Contains a Novel Family of Short Interspersed Elements, Bpu Sequences, and Abundant RNA Editing Sites</article-title>. <source>Mol. Biol. Evol.</source> <volume>25</volume> (<issue>3</issue>), <fpage>603</fpage>&#x2013;<lpage>615</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msn009</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Fastp: An Ultra-fast All-In-One FASTQ Preprocessor</article-title>. <source>Bioinformatics</source> <volume>34</volume> (<issue>17</issue>), <fpage>i884</fpage>&#x2013;<lpage>i890</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bty560</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cheng</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Chu</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Chromosome-level Genome of Himalayan Yew Provides Insights into the Origin and Evolution of the Paclitaxel Biosynthetic Pathway</article-title>. <source>Mol. Plant</source> <volume>14</volume> (<issue>7</issue>), <fpage>1199</fpage>&#x2013;<lpage>1209</lpage>. <pub-id pub-id-type="doi">10.1016/j.molp.2021.04.015</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cole</surname>
<given-names>L. W.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Mower</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Palmer</surname>
<given-names>J. D.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>High and Variable Rates of Repeat-Mediated Mitochondrial Genome Rearrangement in a Genus of Plants</article-title>. <source>Mol. Biol. Evol.</source> <volume>35</volume> (<issue>11</issue>), <fpage>2773</fpage>&#x2013;<lpage>2785</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msy176</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Criscuolo</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Gribaldo</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>BMGE (Block Mapping and Gathering with Entropy): A New Software for Selection of Phylogenetic Informative Regions from Multiple Sequence Alignments</article-title>. <source>BMC Evol. Biol.</source> <volume>10</volume> (<issue>1</issue>), <fpage>210</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2148-10-210</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Darling</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Mau</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Perna</surname>
<given-names>N. T.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>ProgressiveMauve: Multiple Genome Alignment with Gene Gain, Loss and Rearrangement</article-title>. <source>PLoS One</source> <volume>5</volume> (<issue>6</issue>), <fpage>e11147</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0011147</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>De La Torre</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Van de Peer</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ingvarsson</surname>
<given-names>P. K.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Contrasting Rates of Molecular Evolution and Patterns of Selection Among Gymnosperms and Flowering Plants</article-title>. <source>Mol. Biol. Evol.</source> <volume>34</volume> (<issue>6</issue>), <fpage>1363</fpage>&#x2013;<lpage>1377</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msx069</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dong</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>The Complete Mitochondrial Genome of the Early Flowering Plant <italic>Nymphaea Colorata</italic> Is Highly Repetitive with Low Recombination</article-title>. <source>BMC Genomics</source> <volume>19</volume> (<issue>1</issue>), <fpage>614</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-018-4991-4</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Doyle</surname>
<given-names>J. J.</given-names>
</name>
<name>
<surname>Doyle</surname>
<given-names>J. L.</given-names>
</name>
</person-group> (<year>1987</year>). <article-title>A Rapid DNA Isolation Procedure for Small Quantities of Fresh Leaf Tissue</article-title>. <source>Phytochem. Bull.</source> <volume>19</volume>, <fpage>11</fpage>&#x2013;<lpage>15</lpage>. </citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gitzendanner</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Soltis</surname>
<given-names>P. S.</given-names>
</name>
<name>
<surname>Wong</surname>
<given-names>G. K.-S.</given-names>
</name>
<name>
<surname>Ruhfel</surname>
<given-names>B. R.</given-names>
</name>
<name>
<surname>Soltis</surname>
<given-names>D. E.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Plastid Phylogenomic Analysis of Green Plants: A Billion Years of Evolutionary History</article-title>. <source>Am. J. Bot.</source> <volume>105</volume> (<issue>3</issue>), <fpage>291</fpage>&#x2013;<lpage>301</lpage>. <pub-id pub-id-type="doi">10.1002/ajb2.1048</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goremykin</surname>
<given-names>V. V.</given-names>
</name>
<name>
<surname>Lockhart</surname>
<given-names>P. J.</given-names>
</name>
<name>
<surname>Viola</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Velasco</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>The Mitochondrial Genome of <italic>Malus Domestica</italic> and the Import-Driven Hypothesis of Mitochondrial Genome Expansion in Seed Plants</article-title>. <source>Plant J.</source> <volume>71</volume> (<issue>4</issue>), <fpage>615</fpage>&#x2013;<lpage>626</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-313X.2012.05014.x</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grabherr</surname>
<given-names>M. G.</given-names>
</name>
<name>
<surname>Haas</surname>
<given-names>B. J.</given-names>
</name>
<name>
<surname>Yassour</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Levin</surname>
<given-names>J. Z.</given-names>
</name>
<name>
<surname>Thompson</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Amit</surname>
<given-names>I.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Full-length Transcriptome Assembly from RNA-Seq Data without a Reference Genome</article-title>. <source>Nat. Biotechnol.</source> <volume>29</volume> (<issue>7</issue>), <fpage>644</fpage>&#x2013;<lpage>652</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.1883</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Grewe</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Young</surname>
<given-names>G. J.</given-names>
</name>
<name>
<surname>Knoop</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Palmer</surname>
<given-names>J. D.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>
<italic>Ginkgo</italic> and <italic>Welwitschia</italic> Mitogenome Reveal Extreme Contrasts in Gymnosperm Mitochondrial Evolution</article-title>. <source>Mol. Biol. Evol.</source> <volume>33</volume> (<issue>6</issue>), <fpage>1448</fpage>&#x2013;<lpage>1460</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msw024</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Adams</surname>
<given-names>R. P.</given-names>
</name>
<name>
<surname>Mower</surname>
<given-names>J. P.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Extensive Shifts from <italic>Cis</italic>- to <italic>Trans</italic>-splicing of Gymnosperm Mitochondrial Introns</article-title>. <source>Mol. Biol. Evol.</source> <volume>37</volume> (<issue>6</issue>), <fpage>1615</fpage>&#x2013;<lpage>1620</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msaa029</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Mower</surname>
<given-names>J. P.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Complete Mitochondrial Genomes from the Ferns <italic>Ophioglossum Californicum</italic> and <italic>Psilotum Nudum</italic> Are Highly Repetitive with the Largest Organellar Introns</article-title>. <source>New Phytol.</source> <volume>213</volume> (<issue>1</issue>), <fpage>391</fpage>&#x2013;<lpage>403</lpage>. <pub-id pub-id-type="doi">10.1111/nph.14135</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname>
<given-names>X.-G.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Y.-Q.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>
<italic>De Novo</italic> transcriptome Assembly and Characterization for the Widespread and Stress-Tolerant Conifer <italic>Platycladus Orientalis</italic>
</article-title>. <source>PLoS One</source> <volume>11</volume> (<issue>2</issue>), <fpage>e0148985</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0148985</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jackman</surname>
<given-names>S. D.</given-names>
</name>
<name>
<surname>Warren</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>Gibb</surname>
<given-names>E. A.</given-names>
</name>
<name>
<surname>Vandervalk</surname>
<given-names>B. P.</given-names>
</name>
<name>
<surname>Mohamadi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Chu</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Organellar Genomes of White Spruce (<italic>Picea glauca</italic>): Assembly and Annotation</article-title>. <source>Genome Biol. Evol.</source> <volume>8</volume> (<issue>1</issue>), <fpage>29</fpage>&#x2013;<lpage>41</lpage>. <pub-id pub-id-type="doi">10.1093/gbe/evv244</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jin</surname>
<given-names>J.-J.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>W.-B.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>J.-B.</given-names>
</name>
<name>
<surname>Song</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>dePamphilis</surname>
<given-names>C. W.</given-names>
</name>
<name>
<surname>Yi</surname>
<given-names>T.-S.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>GetOrganelle: A Fast and Versatile Toolkit for Accurate <italic>De Novo</italic> Assembly of Organelle Genomes</article-title>. <source>Genome Biol.</source> <volume>21</volume> (<issue>1</issue>), <fpage>241</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-020-02154-5</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kalyaanamoorthy</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Minh</surname>
<given-names>B. Q.</given-names>
</name>
<name>
<surname>Wong</surname>
<given-names>T. K. F.</given-names>
</name>
<name>
<surname>von Haeseler</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Jermiin</surname>
<given-names>L. S.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>ModelFinder: Fast Model Selection for Accurate Phylogenetic Estimates</article-title>. <source>Nat. Methods</source> <volume>14</volume> (<issue>6</issue>), <fpage>587</fpage>&#x2013;<lpage>589</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.4285</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kan</surname>
<given-names>S.-L.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>T.-T.</given-names>
</name>
<name>
<surname>Gong</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Ran</surname>
<given-names>J.-H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.-Q.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The Complete Mitochondrial Genome of <italic>Taxus Cuspidata</italic> (Taxaceae): Eight Protein-Coding Genes Have Transferred to the Nuclear Genome</article-title>. <source>BMC Evol. Biol.</source> <volume>20</volume> (<issue>1</issue>), <fpage>10</fpage>. <pub-id pub-id-type="doi">10.1186/s12862-020-1582-1</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kan</surname>
<given-names>S.-L.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>T.-T.</given-names>
</name>
<name>
<surname>Ran</surname>
<given-names>J.-H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.-Q.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Both Conifer II and Gnetales Are Characterized by a High Frequency of Ancient Mitochondrial Gene Transfer to the Nuclear Genome</article-title>. <source>BMC Biol.</source> <volume>19</volume> (<issue>1</issue>), <fpage>146</fpage>. <pub-id pub-id-type="doi">10.1186/s12915-021-01096-z</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kent</surname>
<given-names>W. J.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>BLAT-The BLAST-like Alignment Tool</article-title>. <source>Genome Res.</source> <volume>12</volume> (<issue>4</issue>), <fpage>656</fpage>&#x2013;<lpage>664</lpage>. <pub-id pub-id-type="doi">10.1101/gr.229202</pub-id> </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kimura</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>1980</year>). <article-title>A Simple Method for Estimating Evolutionary Rates of Base Substitutions through Comparative Studies of Nucleotide Sequences</article-title>. <source>J. Mol. Evol.</source> <volume>16</volume> (<issue>2</issue>), <fpage>111</fpage>&#x2013;<lpage>120</lpage>. <pub-id pub-id-type="doi">10.1007/BF01731581</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Leebens-Mack</surname>
<given-names>J. H.</given-names>
</name>
<name>
<surname>Barker</surname>
<given-names>M. S.</given-names>
</name>
<name>
<surname>Carpenter</surname>
<given-names>E. J.</given-names>
</name>
<name>
<surname>Deyholos</surname>
<given-names>M. K.</given-names>
</name>
<name>
<surname>Gitzendanner</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Graham</surname>
<given-names>S. W.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>One Thousand Plant Transcriptomes and the Phylogenomics of Green Plants</article-title>. <source>Nature</source> <volume>574</volume> (<issue>7780</issue>), <fpage>679</fpage>&#x2013;<lpage>685</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-019-1693-2</pub-id> </citation>
</ref>
<ref id="B26">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2013</year>). <source>Aligning Sequence Reads, Clone Sequences and Assembly Contigs with BWA-MEM</source>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/1303.3997v2 [q-bio.GN]">https://arxiv.org/abs/1303.3997v2 [q-bio.GN]</ext-link> (Accessed June 21, 2018)</comment>. </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Minimap2: Pairwise Alignment for Nucleotide Sequences</article-title>. <source>Bioinformatics</source> <volume>34</volume> (<issue>18</issue>), <fpage>3094</fpage>&#x2013;<lpage>3100</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bty191</pub-id> </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lo Giudice</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Tangaro</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Pesole</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Picardi</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Investigating RNA Editing in Deep Transcriptome Datasets with REDItools and REDIportal</article-title>. <source>Nat. Protoc.</source> <volume>15</volume> (<issue>3</issue>), <fpage>1098</fpage>&#x2013;<lpage>1131</lpage>. <pub-id pub-id-type="doi">10.1038/s41596-019-0279-7</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lowe</surname>
<given-names>T. M.</given-names>
</name>
<name>
<surname>Eddy</surname>
<given-names>S. R.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>tRNAscan-SE: A Program for Improved Detection of Transfer RNA Genes in Genomic Sequence</article-title>. <source>Nucleic Acids Res.</source> <volume>25</volume> (<issue>5</issue>), <fpage>955</fpage>&#x2013;<lpage>964</lpage>. <pub-id pub-id-type="doi">10.1093/nar/25.5.955</pub-id> </citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mar&#xe9;chal</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Brisson</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Recombination and the Maintenance of Plant Organelle Genome Stability</article-title>. <source>New Phytol.</source> <volume>186</volume> (<issue>2</issue>), <fpage>299</fpage>&#x2013;<lpage>317</lpage>. <pub-id pub-id-type="doi">10.1111/j.1469-8137.2010.03195.x</pub-id> </citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marks</surname>
<given-names>R. A.</given-names>
</name>
<name>
<surname>Hotaling</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Frandsen</surname>
<given-names>P. B.</given-names>
</name>
<name>
<surname>VanBuren</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Representation and Participation across 20 Years of Plant Genome Sequencing</article-title>. <source>Nat. Plants</source> <volume>7</volume>, <fpage>1571</fpage>&#x2013;<lpage>1578</lpage>. <pub-id pub-id-type="doi">10.1038/s41477-021-01031-8</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mehrotra</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Goyal</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Repetitive Sequences in Plant Nuclear DNA: Types, Distribution, Evolution and Function</article-title>. <source>Genomics, Proteomics Bioinforma.</source> <volume>12</volume> (<issue>4</issue>), <fpage>164</fpage>&#x2013;<lpage>171</lpage>. <pub-id pub-id-type="doi">10.1016/j.gpb.2014.07.003</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mower</surname>
<given-names>J. P.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>PREP-mt: Predictive RNA Editor for Plant Mitochondrial Genes</article-title>. <source>BMC Bioinforma.</source> <volume>6</volume> (<issue>1</issue>), <fpage>96</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-6-96</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mower</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Touzet</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Gummow</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Delph</surname>
<given-names>L. F.</given-names>
</name>
<name>
<surname>Palmer</surname>
<given-names>J. D.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Extensive Variation in Synonymous Substitution Rates in Mitochondrial Genes of Seed Plants</article-title>. <source>BMC Evol. Biol.</source> <volume>7</volume> (<issue>1</issue>), <fpage>135</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2148-7-135</pub-id> </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mower</surname>
<given-names>J. P.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Variation in Protein Gene and Intron Content Among Land Plant Mitogenomes</article-title>. <source>Mitochondrion</source> <volume>53</volume>, <fpage>203</fpage>&#x2013;<lpage>213</lpage>. <pub-id pub-id-type="doi">10.1016/j.mito.2020.06.002</pub-id> </citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Neale</surname>
<given-names>D. B.</given-names>
</name>
<name>
<surname>Zimin</surname>
<given-names>A. V.</given-names>
</name>
<name>
<surname>Zaman</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Scott</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>Shrestha</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Workman</surname>
<given-names>R. E.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Assembled and Annotated 26.5 Gbp Coast Redwood Genome: A Resource for Estimating Evolutionary Adaptive Potential and Investigating Hexaploid Origin</article-title>. <source>G3 Genes|Genomes|Genetics</source> <volume>12</volume> (<issue>1</issue>), <fpage>jkab380</fpage>. <pub-id pub-id-type="doi">10.1093/g3journal/jkab380</pub-id> </citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nguyen</surname>
<given-names>L.-T.</given-names>
</name>
<name>
<surname>Schmidt</surname>
<given-names>H. A.</given-names>
</name>
<name>
<surname>Von Haeseler</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Minh</surname>
<given-names>B. Q.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>IQ-TREE: A Fast and Effective Stochastic Algorithm for Estimating Maximum-Likelihood Phylogenies</article-title>. <source>Mol. Biol. Evol.</source> <volume>32</volume> (<issue>1</issue>), <fpage>268</fpage>&#x2013;<lpage>274</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msu300</pub-id> </citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nystedt</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Street</surname>
<given-names>N. R.</given-names>
</name>
<name>
<surname>Wetterbom</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Zuccolo</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>Y.-C.</given-names>
</name>
<name>
<surname>Scofield</surname>
<given-names>D. G.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>The Norway Spruce Genome Sequence and Conifer Genome Evolution</article-title>. <source>Nature</source> <volume>497</volume> (<issue>7451</issue>), <fpage>579</fpage>&#x2013;<lpage>584</lpage>. <pub-id pub-id-type="doi">10.1038/nature12211</pub-id> </citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Palmer</surname>
<given-names>J. D.</given-names>
</name>
<name>
<surname>Herbon</surname>
<given-names>L. A.</given-names>
</name>
</person-group> (<year>1988</year>). <article-title>Plant Mitochondrial DNA Evolved Rapidly in Structure, but Slowly in Sequence</article-title>. <source>J. Mol. Evol.</source> <volume>28</volume> (<issue>1</issue>), <fpage>87</fpage>&#x2013;<lpage>97</lpage>. <pub-id pub-id-type="doi">10.1007/BF02143500</pub-id> </citation>
</ref>
<ref id="B40">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Petit</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Vendramin</surname>
<given-names>G. G.</given-names>
</name>
</person-group> (<year>2007</year>). &#x201c;<article-title>Plant Phylogeography Based on Organelle Genes: an Introduction</article-title>,&#x201d; in <source>Phylogeography of Southern European Refugia: Evolutionary Perspectives on the Origins and Conservation of European Biodiversity</source>. Editors <person-group person-group-type="editor">
<name>
<surname>Weiss</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ferrandeds</surname>
<given-names>N.</given-names>
</name>
</person-group> (<publisher-loc>Dordrecht</publisher-loc>: <publisher-name>Springer Netherlands</publisher-name>), <fpage>23</fpage>&#x2013;<lpage>97</lpage>. <pub-id pub-id-type="doi">10.1007/1-4020-4904-8_2</pub-id> </citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Putintseva</surname>
<given-names>Y. A.</given-names>
</name>
<name>
<surname>Bondar</surname>
<given-names>E. I.</given-names>
</name>
<name>
<surname>Simonov</surname>
<given-names>E. P.</given-names>
</name>
<name>
<surname>Sharov</surname>
<given-names>V. V.</given-names>
</name>
<name>
<surname>Oreshkova</surname>
<given-names>N. V.</given-names>
</name>
<name>
<surname>Kuzmin</surname>
<given-names>D. A.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Siberian Larch (<italic>Larix Sibirica</italic> Ledeb.) Mitochondrial Genome Assembled Using Both Short and Long Nucleotide Sequence Reads Is Currently the Largest Known Mitogenome</article-title>. <source>BMC Genomics</source> <volume>21</volume> (<issue>1</issue>), <fpage>654</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-020-07061-4</pub-id> </citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ran</surname>
<given-names>J.-H.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>T.-T.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>M.-M.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.-Q.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Phylogenomics Resolves the Deep Phylogeny of Seed Plants and Indicates Partial Convergent or Homoplastic Evolution between Gnetales and Angiosperms</article-title>. <source>Proc. R. Soc. B</source> <volume>285</volume> (<issue>1881</issue>), <fpage>20181012</fpage>. <pub-id pub-id-type="doi">10.1098/rspb.2018.1012</pub-id> </citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rice</surname>
<given-names>D. W.</given-names>
</name>
<name>
<surname>Alverson</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Richardson</surname>
<given-names>A. O.</given-names>
</name>
<name>
<surname>Young</surname>
<given-names>G. J.</given-names>
</name>
<name>
<surname>Sanchez-Puerta</surname>
<given-names>M. V.</given-names>
</name>
<name>
<surname>Munzinger</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Horizontal Transfer of Entire Genomes via Mitochondrial Fusion in the Angiosperm <italic>Amborella</italic>
</article-title>. <source>Science</source> <volume>342</volume> (<issue>6165</issue>), <fpage>1468</fpage>&#x2013;<lpage>1473</lpage>. <pub-id pub-id-type="doi">10.1126/science.1246275</pub-id> </citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Richardson</surname>
<given-names>A. O.</given-names>
</name>
<name>
<surname>Rice</surname>
<given-names>D. W.</given-names>
</name>
<name>
<surname>Young</surname>
<given-names>G. J.</given-names>
</name>
<name>
<surname>Alverson</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Palmer</surname>
<given-names>J. D.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>The &#x201c;Fossilized&#x201d; Mitochondrial Genome of <italic>Liriodendron Tulipifera</italic>: Ancestral Gene Content and Order, Ancestral Editing Sites, and Extraordinarily Low Mutation Rate</article-title>. <source>BMC Biol.</source> <volume>11</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.1186/1741-7007-11-29</pub-id> </citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ruhfel</surname>
<given-names>B. R.</given-names>
</name>
<name>
<surname>Gitzendanner</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Soltis</surname>
<given-names>P. S.</given-names>
</name>
<name>
<surname>Soltis</surname>
<given-names>D. E.</given-names>
</name>
<name>
<surname>Burleigh</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>From Algae to Angiosperms-Inferring the Phylogeny of Green Plants (<italic>Viridiplantae</italic>) from 360 Plastid Genomes</article-title>. <source>BMC Evol. Biol.</source> <volume>14</volume> (<issue>1</issue>), <fpage>23</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2148-14-23</pub-id> </citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Scott</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>Zimin</surname>
<given-names>A. V.</given-names>
</name>
<name>
<surname>Puiu</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Workman</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Britton</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zaman</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>A Reference Genome Sequence for Giant Sequoia</article-title>. <source>G3 Genes|Genomes|Genetics</source> <volume>10</volume> (<issue>11</issue>), <fpage>3907</fpage>&#x2013;<lpage>3919</lpage>. <pub-id pub-id-type="doi">10.1534/g3.120.401612</pub-id> </citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Skippington</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Barkman</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Rice</surname>
<given-names>D. W.</given-names>
</name>
<name>
<surname>Palmer</surname>
<given-names>J. D.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Miniaturized Mitogenome of the Parasitic Plant <italic>Viscum Scurruloideum</italic> Is Extremely Divergent and Dynamic and Has Lost All <italic>Nad</italic> Genes</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>112</volume> (<issue>27</issue>), <fpage>E3515</fpage>&#x2013;<lpage>E3524</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1504491112</pub-id> </citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Slater</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Birney</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Automated Generation of Heuristics for Biological Sequence Comparison</article-title>. <source>BMC Bioinforma.</source> <volume>6</volume>, <fpage>31</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-6-31</pub-id> </citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sloan</surname>
<given-names>D. B.</given-names>
</name>
<name>
<surname>Alverson</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Chuckalovcak</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>McCauley</surname>
<given-names>D. E.</given-names>
</name>
<name>
<surname>Palmer</surname>
<given-names>J. D.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>Rapid Evolution of Enormous, Multichromosomal Genomes in Flowering Plant Mitochondria with Exceptionally High Mutation Rates</article-title>. <source>PLoS Biol.</source> <volume>10</volume> (<issue>1</issue>), <fpage>e1001241</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pbio.1001241</pub-id> </citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smit</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hubley</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Green</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>RepeatMasker Open-4.0. 2013-2015</article-title>. <comment>Available at: http://www.repeatmasker.org (accessed June 01, 2021)</comment>. </citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smit</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hubley</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>RepeatModeler Open-1.0. 2008-2015</article-title>. <comment>Available at: http://www.repeatmasker.org (accessed June 01, 2021)</comment>. </citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smith</surname>
<given-names>D. R.</given-names>
</name>
<name>
<surname>Keeling</surname>
<given-names>P. J.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Mitochondrial and Plastid Genome Architecture: Reoccurring Themes, but Significant Differences at the Extremes</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>112</volume> (<issue>33</issue>), <fpage>10177</fpage>&#x2013;<lpage>10184</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1422049112</pub-id> </citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stanke</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Diekhans</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Baertsch</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Haussler</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Using Native and Syntenically Mapped cDNA Alignments to Improve <italic>De Novo</italic> Gene Finding</article-title>. <source>Bioinformatics</source> <volume>24</volume> (<issue>5</issue>), <fpage>637</fpage>&#x2013;<lpage>644</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btn013</pub-id> </citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sullivan</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Eldfjell</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Schiffthaler</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Delhomme</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Asp</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Hebelstrup</surname>
<given-names>K. H.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>The Mitogenome of Norway Spruce and a Reappraisal of Mitochondrial Recombination in Plants</article-title>. <source>Genome Biol. Evol.</source> <volume>12</volume> (<issue>1</issue>), <fpage>3586</fpage>&#x2013;<lpage>3598</lpage>. <pub-id pub-id-type="doi">10.1093/gbe/evz263</pub-id> </citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Szmidt</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>M.-Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.-R.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Effects of RNA Editing on the <italic>coxI</italic> Evolution and Phylogeny Reconstruction</article-title>. <source>Euphytica</source> <volume>118</volume> (<issue>1</issue>), <fpage>9</fpage>&#x2013;<lpage>18</lpage>. <pub-id pub-id-type="doi">10.1023/A:1004046220115</pub-id> </citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wan</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z.-M.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.-F.</given-names>
</name>
<name>
<surname>Leitch</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Leitch</surname>
<given-names>I. J.</given-names>
</name>
<name>
<surname>Lohaus</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>A Genome for Gnetophytes and Early Evolution of Seed Plants</article-title>. <source>Nat. Plants</source> <volume>4</volume> (<issue>2</issue>), <fpage>82</fpage>&#x2013;<lpage>89</lpage>. <pub-id pub-id-type="doi">10.1038/s41477-017-0097-2</pub-id> </citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wan</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Leitch</surname>
<given-names>I. J.</given-names>
</name>
<name>
<surname>Xin</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Maggs-K&#xf6;lling</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Gong</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>The <italic>Welwitschia</italic> Genome Reveals a Unique Biology Underpinning Extreme Longevity in Deserts</article-title>. <source>Nat. Commun.</source> <volume>12</volume>, <fpage>4247</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-021-24528-4</pub-id> </citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>X.-Q.</given-names>
</name>
<name>
<surname>Ran</surname>
<given-names>J.-H.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Evolution and Biogeography of Gymnosperms</article-title>. <source>Mol. Phylogenetics Evol.</source> <volume>75</volume>, <fpage>24</fpage>&#x2013;<lpage>40</lpage>. <pub-id pub-id-type="doi">10.1016/j.ympev.2014.02.005</pub-id> </citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wegrzyn</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Tearse</surname>
<given-names>B. R.</given-names>
</name>
<name>
<surname>Neale</surname>
<given-names>D. B.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>TreeGenes: A Forest Tree Genome Database</article-title>. <source>Int. J. Plant Genomics</source> <volume>2008</volume>, <fpage>1</fpage>&#x2013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1155/2008/412875</pub-id> </citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wick</surname>
<given-names>R. R.</given-names>
</name>
<name>
<surname>Schultz</surname>
<given-names>M. B.</given-names>
</name>
<name>
<surname>Zobel</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Holt</surname>
<given-names>K. E.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Bandage: Interactive Visualization of <italic>De Novo</italic> Genome Assemblies</article-title>. <source>Bioinformatics</source> <volume>31</volume> (<issue>20</issue>), <fpage>3350</fpage>&#x2013;<lpage>3352</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btv383</pub-id> </citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>Z. Q.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>X. Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X. N.</given-names>
</name>
<name>
<surname>Tembrock</surname>
<given-names>L. R.</given-names>
</name>
<name>
<surname>Broz</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Genomic Architectural Variation of Plant Mitochondria-A Review of Multichromosomal Structuring</article-title>. <source>J Sytematics Evol.</source> <volume>60</volume>, <fpage>160</fpage>&#x2013;<lpage>168</lpage>. <pub-id pub-id-type="doi">10.1111/jse.12655</pub-id> </citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xia</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.-R.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Microhomologies Are Associated with Tandem Duplications and Structural Variation in Plant Mitochondrial Genomes</article-title>. <source>Genome Biol. Evol.</source> <volume>12</volume> (<issue>11</issue>), <fpage>1965</fpage>&#x2013;<lpage>1974</lpage>. <pub-id pub-id-type="doi">10.1093/gbe/evaa172</pub-id> </citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiong</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Gou</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Bi</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>The <italic>Taxus</italic> Genome Provides Insights into Paclitaxel Biosynthesis</article-title>. <source>Nat. Plants</source> <volume>7</volume> (<issue>8</issue>), <fpage>1026</fpage>&#x2013;<lpage>1036</lpage>. <pub-id pub-id-type="doi">10.1038/s41477-021-00963-5</pub-id> </citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>PAML 4: Phylogenetic Analysis by Maximum Likelihood</article-title>. <source>Mol. Biol. Evol.</source> <volume>24</volume> (<issue>8</issue>), <fpage>1586</fpage>&#x2013;<lpage>1591</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msm088</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>