<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2024.1339594</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Plasticity of repetitive sequences demonstrated by the complete mitochondrial genome of <italic>Eucalyptus camaldulensis</italic>
</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Fukasawa</surname>
<given-names>Yoshinori</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2578894"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Driguez</surname>
<given-names>Patrick</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2623480"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Bougouffa</surname>
<given-names>Salim</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/201975"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Carty</surname>
<given-names>Karen</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Putra</surname>
<given-names>Alexander</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2621255"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Cheung</surname>
<given-names>Ming-Sin</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2695117"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ermini</surname>
<given-names>Luca</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1251218"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Center for Bioscience Research and Education, Utsunomiya University</institution>, <addr-line>Utsunomiya</addr-line>, <country>Japan</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Core Labs, King Abdullah University of Science and Technology</institution>, <addr-line>Thuwal</addr-line>, <country>Saudi Arabia</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Computational Bioscience Research Center, King Abdullah University of Science and Technology</institution>, <addr-line>Thuwal</addr-line>, <country>Saudi Arabia</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>NORLUX NeuroOncology Laboratory, Department of Cancer Research, Luxembourg Institute of Health</institution>, <addr-line>Luxembourg</addr-line>, <country>Luxembourg</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Daojun Yuan, Huazhong Agricultural University, China</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Shin-ichi Arimura, The University of Tokyo, Japan</p>
<p>Tomohiko Kazama, Kyushu University, Japan</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Yoshinori Fukasawa, <email xlink:href="mailto:yoshinori.fukasawa@cc.utsunomiya-u.ac.jp">yoshinori.fukasawa@cc.utsunomiya-u.ac.jp</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>27</day>
<month>03</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>15</volume>
<elocation-id>1339594</elocation-id>
<history>
<date date-type="received">
<day>16</day>
<month>11</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>07</day>
<month>03</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Fukasawa, Driguez, Bougouffa, Carty, Putra, Cheung and Ermini</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Fukasawa, Driguez, Bougouffa, Carty, Putra, Cheung and Ermini</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>The tree <italic>Eucalyptus camaldulensis</italic> is a ubiquitous member of the <italic>Eucalyptus</italic> genus, which includes several hundred species. Despite the extensive sequencing and assembly of nuclear genomes from various eucalypts, the genus has only one fully annotated and complete mitochondrial genome (mitogenome). Plant mitochondria are characterized by dynamic genomic rearrangements, facilitated by repeat content, a feature that has hindered the assembly of plant mitogenomes. This complexity is evident in the paucity of available mitogenomes. This study, to the best of our knowledge, presents the first <italic>E. camaldulensis</italic> mitogenome. Our findings suggest the presence of multiple isomeric forms of the <italic>E. camaldulensis</italic> mitogenome and provide novel insights into minor rearrangements triggered by nested repeat sequences. A comparative sequence analysis of the <italic>E. camaldulensis</italic> and <italic>E. grandis</italic> mitogenomes unveils evolutionary changes between the two genomes. A significant divergence is the evolution of a large repeat sequence, which may have contributed to the differences observed between the two genomes. The largest repeat sequences in the <italic>E. camaldulensis</italic> mitogenome align well with significant yet unexplained structural variations in the <italic>E. grandis</italic> mitogenome, highlighting the adaptability of repeat sequences in plant mitogenomes.</p>
</abstract>
<kwd-group>
<kwd>mitochondrial genome</kwd>
<kwd>eucalyptus</kwd>
<kwd>repeat sequences</kwd>
<kwd>homologous recombination</kwd>
<kwd>nested repeat</kwd>
<kwd>isomer</kwd>
</kwd-group>
<contract-num rid="cn001">23K19338</contract-num>
<contract-sponsor id="cn001">Japan Society for the Promotion of Science<named-content content-type="fundref-id">10.13039/501100001691</named-content>
</contract-sponsor>
<counts>
<fig-count count="6"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="34"/>
<page-count count="11"/>
<word-count count="5760"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Plant Bioinformatics</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Eucalyptus trees, known for their rapid growth rates, are increasingly recognized for their significant contribution to a sustainable economy. This is marked by the numerous nuclear reference genome assemblies of the <italic>Eucalyptus</italic> genus registered in NCBI (<xref ref-type="bibr" rid="B24">Myburg et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B31">Wang et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B13">Driguez et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B21">L&#xf6;tter et&#xa0;al., 2022</xref>). Among several hundred species within this genus, <italic>Eucalyptus camaldulensis</italic>, river red gum, has the broadest geographical distribution (<xref ref-type="bibr" rid="B5">Butcher et&#xa0;al., 2002</xref>).</p>
<p>Using PacBio high-accuracy long-read (HiFi) sequencing, we have previously assembled the nuclear genome of <italic>E. camaldulensis</italic> and demonstrated that chromosome-scale assembly is feasible (<xref ref-type="bibr" rid="B13">Driguez et&#xa0;al., 2021</xref>). In contrast to the continuous assembly of the nuclear genome, there were numerous fragmented sequences that resembled organelle genomes. Due to the high degree of fragmentation, the mitogenome has not yet been determined. This issue extends beyond <italic>E. camaldulensis</italic> and represents a common challenge across different species of eucalypts. While multiple nuclear genomes are available, only one fully annotated mitogenome for <italic>E. grandis</italic> exists within the <italic>Eucalyptus</italic> genus (<xref ref-type="bibr" rid="B25">Pinard et&#xa0;al., 2019</xref>).</p>
<p>The mitochondria provide numerous essential pathways for eukaryotic cells, despite the fact that the majority of proteins are encoded by nuclear genomes (<xref ref-type="bibr" rid="B15">Fukasawa et&#xa0;al., 2015</xref>), which reflects the smaller size of mitochondrial genomes. Plant mitogenomes exhibit diverse evolutionary patterns, complicating assembly efforts despite their small size. Angiosperm mitogenomes show a considerable variation in size and gene content, ranging from 66 kb to 11.3 Mb, in contrast to the relatively stable size of plastid genomes (<xref ref-type="bibr" rid="B27">Sloan, 2013</xref>; <xref ref-type="bibr" rid="B29">Sun et&#xa0;al., 2022</xref>). Although angiosperm mitogenomes have low sequence evolution rates, the synteny conservation rates remain low due to frequent genome rearrangements (<xref ref-type="bibr" rid="B11">Cole et&#xa0;al., 2018</xref>). Such rearrangements, resulting from homologous recombination, play a significant role in plant mitogenome evolution.</p>
<p>Cross-ecotype comparisons of <italic>Arabidopsis</italic> plants revealed that disrupting the plant-specific <italic>MSH1</italic> gene results in stoichiometric changes and that polymorphisms among <italic>Arabidopsis</italic> ecotypes are caused by <italic>MSH1</italic>-regulated recombination (<xref ref-type="bibr" rid="B4">Arrieta-Montiel et&#xa0;al., 2009</xref>). A recent report also emphasizes the crucial role of <italic>MSH1</italic> in mitigating mutation rates in plant organelles (<xref ref-type="bibr" rid="B33">Wu et&#xa0;al., 2020</xref>). This distinctive genetic feature in plants indicates the high occurrences of homologous recombination-based rearrangements in plant mitogenomes, highlighting the need for analytical approaches different from those used for nuclear genomes (<xref ref-type="bibr" rid="B14">Fischer et&#xa0;al., 2022</xref>). The intricate rearrangement patterns observed in the study suggest the need for further methodological innovations in order to fully understand the dynamic nature of plant mitogenomes.</p>
<p>In this study, we assembled, for the first time, the complete mitogenome of <italic>E. camaldulensis</italic> using PacBio HiFi sequencing. Further validation of the assembled sequence was conducted using Oxford Nanopore Technologies (ONT) sequencing, which confirmed the existence of multiple forms of the mitogenome. Following the chloroplast/plastid (GenBank: CM024681.1) and nuclear (<xref ref-type="bibr" rid="B13">Driguez et&#xa0;al., 2021</xref>) genomes, the mitogenome of <italic>E. camaldulensi</italic>s, as presented in this study, represents the final piece of the entire genetic information of the species.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Genome assembly and annotation of mitogenome</title>
<p>PacBio Sequel-II raw subread data generated from the whole genome of <italic>E. camaldulensis</italic> was downloaded from NCBI and was used for the mitogenome assembly (SRX11929917). High Fidelity Circular Consensus reads (HiFi CCS) were locally called from the downloaded subread data using SMRTLink ver. 11.1. The first <italic>de novo</italic> assembly was computed using hifiasm ver. 0.16.1 (<xref ref-type="bibr" rid="B9">Cheng et&#xa0;al., 2021</xref>) against the whole PacBio HiFi dataset. Hereafter we refer to contigs computed by hifiasm as those computed with the whole-genome sequencing dataset, including nuclear genome assembly (<xref ref-type="bibr" rid="B13">Driguez et&#xa0;al., 2021</xref>). We searched mitogenome contigs with homology to the mitogenome of <italic>E. grandis</italic> (NCBI reference sequence: NC_040010.1). Because the collected contigs show different forms of the sequences, rearrangements mediated by repeat sequences were considered to explain multiple contigs (<xref ref-type="bibr" rid="B27">Sloan, 2013</xref>). Therefore, a repeat-aware graph assembler was applied to suppress this issue (<xref ref-type="bibr" rid="B14">Fischer et&#xa0;al., 2022</xref>). To accelerate computational time, mitochondria-derived reads were extracted from the original dataset using the <italic>E. grandis</italic> genome with minimum query coverage to the reference at 70% using minimap2 ver.2.26 (<xref ref-type="bibr" rid="B20">Li, 2018</xref>). We assembled the <italic>E. camaldulensis</italic> mitogenome using Flye ver. 2.8.3 with default parameters (<xref ref-type="bibr" rid="B19">Kolmogorov et&#xa0;al., 2019</xref>). The assembled mitogenome contig was annotated by using MITOFY ver. March 22, 2012 (<xref ref-type="bibr" rid="B3">Alverson et&#xa0;al., 2010</xref>) and tRNAscan-SE ver. 2 (<xref ref-type="bibr" rid="B6">Chan et&#xa0;al., 2021</xref>) with manual corrections to confirm the annotation. The genome circle map was drawn by using ORGDRAW ver. 1.3.1 (<xref ref-type="bibr" rid="B17">Greiner et&#xa0;al., 2019</xref>). The mitochondrial reads were reextracted from the entire dataset by mapping against reference sequences containing our mitogenome assembly, the nuclear genome (GCA_019915185.1), and the plastid genome (CM024681.1) for further analysis.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Repeat analysis</title>
<p>The direct repeat (DR) and inverted repeat (IR) contents of the <italic>E. camaldulensis</italic> mitogenome were analyzed using ROUSfinder ver. 2.0 and blastn ver. 2.14.1 (<xref ref-type="bibr" rid="B2">Altschul et&#xa0;al., 1997</xref>; <xref ref-type="bibr" rid="B34">Wynn and Christensen, 2019</xref>). Validation of the repeat-mediated genomic rearrangement was performed by mapping the mitochondria-derived reads against all possible sequences with the target repeat in the middle. Specifically, for each repeat pair detected by ROUSfinder, 3,000-bp flanking sequences upstream and downstream of the repeat sequence were extracted, and four sequences representing possible isomers mediated by homologous recombination were generated with the extracted flanking and the target repeat sequences. These generated sequences were combined as a reference set. The mitochondria-derived reads were mapped to the reference sequence set using minimap2 ver. 2.26, and supporting reads were counted for each repeat pair if a read is mapped to a sequence with at least 1,800-bp overlap to flanking sequences in both ends as a primary alignment. A few repeats are nested in another larger repeat sequence; however, the 1,800-bp threshold is long enough to detect unique sequences beyond the repeat sequence covering the target nested repeat (the largest covering repeat sequence has 1,467 bp in length). The assembly used for the repeat analysis was named Master Circle 1 form (MC1). It should be noted that because the rates of rearrangement mediated by the long (&gt;1,000 bp) repeat pairs were significant, we designated the rearranged MC1 sequence mediated by the longest repeat (repeat-1) as Master Circle 2 form (MC2). Additionally, the sequences of MC1 and MC2 rearranged by the second longest repeat (repeat-2) were termed MC1<sup>2</sup> and MC2<sup>2</sup>, respectively.</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Sequence comparison</title>
<p>The mitogenomes of <italic>E. grandis</italic> and <italic>E. camaldulensis</italic> were compared using LAST ver. 1454 (<xref ref-type="bibr" rid="B18">Kie&#x142;basa et&#xa0;al., 2011</xref>) with default parameters. The MC2 of the <italic>E. camaldulensis</italic> mitogenome was selected as a representative sequence due to the least number of variations compared to the <italic>E. grandis</italic> mitogenome. Detected significant hits were visualized and summarized using the maf-convert command. Large rearrangements were visualized by using SyRI (<xref ref-type="bibr" rid="B16">Goel et&#xa0;al., 2019</xref>). An E-value of 1e-20 was used as the threshold.</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Phylogenetic analysis</title>
<p>The taxonomic placement of <italic>E. camaldulensis</italic> was established by analyzing the complete mitochondrial genomes of all plant species within the <italic>Myrtaceae</italic> family available in the NCBI database. The complete genomes of <italic>E. grandis</italic>, <italic>Syzygium samarangense</italic>, and <italic>Rhodomyrtus tomentosa</italic> (accession numbers: NC_040010.1, NC_079700.1, and NC_071968.1, respectively) were downloaded. The complete mitochondrial genome of <italic>Begonia coptidifolia</italic> (accession number: LC706752.1) was used as an outgroup for rooting purposes. A multiple sequence alignment of five mitochondrial genomes, including <italic>E. camaldulensis</italic>, was generated using progressiveMauve with default parameters (<xref ref-type="bibr" rid="B12">Darling et&#xa0;al., 2010</xref>). Phylogenetic relationships were reconstructed using maximum likelihood with the general time reversible model. Initial trees for the heuristic search were obtained automatically by applying neighbor-joining and BioNJ algorithms to a matrix of pairwise distances estimated using the maximum composite likelihood approach and then selecting the topology with a superior log likelihood value. To model differences in the rates of evolution between sites, a discrete Gamma distribution was used. Positions containing missing/ambiguous data were excluded. An estimate of support for each branch was determined with the bootstrap test using 100 pseudoreplications. Phylogenetic analyses were conducted in MEGA11 (<xref ref-type="bibr" rid="B30">Tamura et&#xa0;al., 2021</xref>).</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Sample collection and HMW DNA extraction</title>
<p>Fresh <italic>E. camaldulensis</italic> leaves were collected from the research greenhouse at King Abdullah University of Science and Technology, Thuwal, Saudi Arabia. HMW DNA was extracted by following a modified Qiagen protocol (dx.doi.org/10.17504/protocols.io.bafmibk6).</p>
</sec>
<sec id="s2_6">
<label>2.6</label>
<title>Oxford nanopore sequencing</title>
<p>This study utilized the GridION sequencer for Oxford Nanopore sequencing of <italic>E. camaldulensis</italic>. In preparation for library creation, short fragments were removed from the extracted HMW DNA using either BluePippin with a 30-kb cutoff or the Short Read Eliminator XL kit (SRE XL, Circulomics, Baltimore, MD, USA) as per the manufacturer&#x2019;s instructions. The size-selected DNA underwent a cleanup process with AMPure XP beads, followed by library processing using the genomic DNA by ligation protocol (SQK-LSK109, Oxford Nanopore, Oxford, UK). Specifically, DNA samples of <italic>E. camaldulensis</italic> (1.3 &#x3bc;g) were repaired and end-prepped before bead cleanup and adapter ligation. The ligated product underwent bead cleaning with long fragment buffer (LFB) and was subsequently eluted. The prepared library for <italic>E. camaldulensis</italic> (8 fmol) was loaded onto the GridION platform (FLO-MIN106D). This study extracted mitochondrial reads from the ONT dataset using the same criterion applied for the HiFi dataset. The duplex-like reads (i.e., reads mappable to the same region on the reference in two strands) were removed because they cannot be mapped lineally.</p>
</sec>
<sec id="s2_7">
<label>2.7</label>
<title>Validation of repeat-mediated rearrangements</title>
<p>The mitochondrial reads in both HiFi and ONT datasets were mapped against MC1 sequence. Only the reads that had 95% of their bases aligned linearly with the MC1 sequence were retained for coverage computation. Reads that were partially mapped, i.e., those with less than 95% of their bases were aligned linearly, were mapped against an alternative sequence, MC2<sup>2</sup>. This was done if a portion of the reads fully and linearly aligned with the alternative form but not with the reference sequence. To filter reads, CoverM ver. 0.7.0 was utilized (<ext-link ext-link-type="uri" xlink:href="https://github.com/wwood/CoverM">https://github.com/wwood/CoverM</ext-link>).</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Structure of <italic>E. camaldulensis</italic> mitochondria genome</title>
<p>The assembled <italic>E. camaldulensis</italic> mitogenome is a single circular sequence of 463,134 bp, with an overall GC content of 45.11% (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>). The mitogenome has a quadripartite structure that is characterized by a pair of long (8,986 bp) IR sequences (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S1</bold>
</xref>). Our findings suggest that a circular form, rather than the hypothetical linear structure previously discussed in the case of <italic>E. grandis</italic> (<xref ref-type="bibr" rid="B25">Pinard et&#xa0;al., 2019</xref>), is dominant in the mitogenome of <italic>E. camaldulensis</italic>. In our <italic>E. camaldulensis</italic> assembly, we did not find any results that support the linear structure. However, it should be noted that this does not exclude the possibility that the mitogenome contains a head-to-tail concatemer structure <italic>in vivo</italic> (<xref ref-type="bibr" rid="B27">Sloan, 2013</xref>).</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Circular map of the <italic>E. camaldulensis</italic> mitochondrial genome. Genes inside the circle represent genes transcribed clockwise, and genes outside the circle are transcribed counterclockwise. Genes are categorized based on their functional classification, and the coloring schema is summarized in the center of the circle. The &#x201c;#&#x201d; symbol indicates genes that include introns. The inner circle shows the GC content of the genome.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1339594-g001.tif"/>
</fig>
<p>Annotations were made for 38 conventional protein-coding genes within the single circle model. In addition, 19 tRNA genes and five rRNA genes were observed (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>). The <italic>E. camaldulensis</italic> mitogenome seems to have lost <italic>rps2</italic> and <italic>rps1</italic> genes (<xref ref-type="bibr" rid="B1">Adams et&#xa0;al., 2002</xref>). Although fragmented homologous sequences of <italic>rps19</italic> were detected in the mitogenome, stop codons were also observed in the middle of the gene. Two copies of <italic>5S rRNA</italic> were found, which are also present in the mitogenome of <italic>E. grandis</italic>. Two copies of <italic>18S rRNA</italic> were also annotated on the <italic>E. camaldulensis</italic> mitogenome, which was previously described as a single copy gene in <italic>E. grandis</italic> mitogenome (<xref ref-type="bibr" rid="B25">Pinard et&#xa0;al., 2019</xref>). Overall, it appears that the gene content is well conserved between the two <italic>Eucalyptus</italic> mitogenomes.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Gene composition in the mitogenome of <italic>E. camaldulensis</italic>.</p>
</caption>
<table frame="hsides">
<tbody>
<tr>
<td valign="top" rowspan="3" align="left">Complex I</td>
<td valign="middle" align="left">nad1 (#)</td>
<td valign="middle" align="left">nad2 (#)</td>
<td valign="middle" align="left">nad3</td>
<td valign="middle" align="left">nad4 (#)</td>
</tr>
<tr>
<td valign="middle" align="left">nad4L</td>
<td valign="middle" align="left">nad5 (#)</td>
<td valign="middle" align="left">nad6</td>
<td valign="middle" align="left">nad7 (#)</td>
</tr>
<tr>
<td valign="middle" align="left">nad9</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="top" align="left">Complex II</td>
<td valign="middle" align="left">sdh3</td>
<td valign="middle" align="left">sdh4</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="top" align="left">Complex III</td>
<td valign="middle" align="left">cob</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="top" align="left">Complex IV</td>
<td valign="middle" align="left">cox1</td>
<td valign="middle" align="left">cox2 (#)</td>
<td valign="middle" align="left">cox3</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="top" rowspan="2" align="left">Complex V</td>
<td valign="middle" align="left">atp1</td>
<td valign="middle" align="left">atp4</td>
<td valign="middle" align="left">atp6</td>
<td valign="middle" align="left">atp8</td>
</tr>
<tr>
<td valign="middle" align="left">atp9</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="top" align="left">Cytochrome C biogenesis</td>
<td valign="middle" align="left">ccmB</td>
<td valign="middle" align="left">ccmC</td>
<td valign="middle" align="left">ccmFc (#)</td>
<td valign="middle" align="left">ccmFn</td>
</tr>
<tr>
<td valign="top" align="left">Ribosomal genes (small subunit)</td>
<td valign="middle" align="left">rpl2 (#)</td>
<td valign="middle" align="left">rpl5</td>
<td valign="middle" align="left">rpl10</td>
<td valign="middle" align="left">rpl16</td>
</tr>
<tr>
<td valign="top" rowspan="2" align="left">Ribosomal genes (large subunit)</td>
<td valign="middle" align="left">rps1</td>
<td valign="middle" align="left">rps3 (#)</td>
<td valign="middle" align="left">rps4</td>
<td valign="middle" align="left">rps7</td>
</tr>
<tr>
<td valign="middle" align="left">rps10</td>
<td valign="middle" align="left">rps12</td>
<td valign="middle" align="left">rps13</td>
<td valign="middle" align="left">rps14</td>
</tr>
<tr>
<td valign="top" align="left">Other</td>
<td valign="middle" align="left">matR</td>
<td valign="middle" align="left">mttB</td>
<td valign="middle" align="left"/>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="top" align="left">rRNA</td>
<td valign="middle" align="left">26S rRNA</td>
<td valign="middle" align="left">18S rRNA (x2)</td>
<td valign="middle" align="left">5S rRNA (x2)</td>
<td valign="middle" align="left"/>
</tr>
<tr>
<td valign="top" rowspan="4" align="left">tRNA</td>
<td valign="middle" align="left">tRNA-Asn (x2)</td>
<td valign="middle" align="left">tRNA-Asp</td>
<td valign="middle" align="left">tRNA-Cys</td>
<td valign="middle" align="left">tRNA-Gln</td>
</tr>
<tr>
<td valign="middle" align="left">tRNA-Glu</td>
<td valign="middle" align="left">tRNA-Gly</td>
<td valign="middle" align="left">tRNA-His (pl)</td>
<td valign="middle" align="left">tRNA-Ile (x2)</td>
</tr>
<tr>
<td valign="middle" align="left">tRNA-Lys</td>
<td valign="middle" align="left">tRNA-fMet</td>
<td valign="middle" align="left">tRNA-Met</td>
<td valign="middle" align="left">tRNA-Phe</td>
</tr>
<tr>
<td valign="middle" align="left">tRNA-Pro</td>
<td valign="middle" align="left">tRNA-Ser (x2)</td>
<td valign="middle" align="left">tRNA-Trp (pl)</td>
<td valign="middle" align="left">tRNA-Tyr</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>The symbol &#x201c;(#)&#x201d; labels the genes that contain introns. tRNA genes like the plastid type are indicated by &#x201c;(pl)&#x201d;.</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Phylogeny of E. camaldulensis</title>
<p>To date, there are only three complete mitochondrial sequences from the <italic>Myrtaceae</italic> family being publicly available. For the sake of completeness, we performed a phylogenetic analysis to ascertain the phylogenetic placement of the <italic>E. camaldulensis</italic> mitogenome. The topology of the phylogenetic tree suggests a strong phylogenetic connection between the two eucalypt species, <italic>E. grandis</italic> and <italic>E. camaldulensis</italic> (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2A</bold>
</xref>). The tree topology aligns with the phylogenetic tree inferred using mitogenomes by <xref ref-type="bibr" rid="B22">Lu and Li (2024)</xref>.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Phylogeny of <italic>E. camaldulensis</italic> and rRNA gene conservation. <bold>(A)</bold> Phylogenetic relationship of <italic>E. camaldulensis</italic>, three <italic>Myrtaceae</italic> plants, and <italic>B. coptidifolia</italic> as an outgroup. The tree is based on the mitogenome sequences of the represented species, and the numbers on the tree nodes represent bootstrap values. <bold>(B)</bold> Relationship between <italic>18S rRNA</italic> and <italic>5S rRNA</italic> genes across five genomes, and their copy numbers are annotated on each mitogenome. The <italic>26S rRNA</italic> gene is also reported; for graphical purposes, only a single representation is used.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1339594-g002.tif"/>
</fig>
<p>The co-transcription and physical proximity of <italic>18S rRNA</italic> and <italic>5S rRNA</italic> in plant mitogenomes have been reported (<xref ref-type="bibr" rid="B8">Chen et&#xa0;al., 2017</xref>). Given the topology of the phylogeny, the varying copy numbers of these genes suggest multiple hypotheses for the evolution of these two genes on the mitogenome in the <italic>Myrtaceae</italic> family (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>). The most parsimonious hypothesis is that a single duplication of <italic>5S rRNA</italic> occurred in a common ancestor of the two eucalypts, followed by a duplication of <italic>18S rRNA</italic> in the lineage of <italic>E. camaldulensis</italic>. This hypothesis assumes that there was a duplication event of <italic>18S rRNA</italic> into a proximal physical location of <italic>5S rRNA</italic>. Alternatively, another hypothesis suggests that there were two duplication events of the two genes in a common ancestor, with a subsequent loss of <italic>18S rRNA</italic> that happened in the lineage of <italic>E. grandis</italic>. Estimating the most likely evolution requires additional information regarding the state of the last common ancestor and more complete mitogenomes.</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Repeat sequences and major isomeric forms of the mitogenome</title>
<p>The number of detected dispersed repeat sequences was 63, and the repeat size ranged from 50 bp to 9 kb (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref>). In the long repeat category (&gt;1,000 bp), we identified pairs of IRs and DRs with lengths of 8,986 and 1,467 bp, respectively. As it has been argued that rearrangement mediated by long repeats is frequent in the plant mitogenomes (<xref ref-type="bibr" rid="B26">Siculella et&#xa0;al., 2001</xref>; <xref ref-type="bibr" rid="B27">Sloan, 2013</xref>), other possible isomeric forms were investigated by read mapping (see &#x201c;Materials and methods&#x201d;). Rearrangements by long repeat sequences are more common than those mediated by middle or short repeat sequences (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). In particular, isomeric forms mediated by the pair of the largest IR seem to exist at an equal frequency, similar to other plant mitochondria (<xref ref-type="bibr" rid="B28">Sloan et&#xa0;al., 2010</xref>) and chloroplast genomes (<xref ref-type="bibr" rid="B32">Wang and Lanfear, 2019</xref>). Rearrangement mediated by the second largest DR pair is also common. The data are consistent with a multipartite mitochondrial genome as a two-circle model (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3A</bold>
</xref>). As an attempt to validate these rearrangements mediated by dispersed repeats, we analyzed our assembly using the Oxford Nanopore sequencing platform as an alternative and independent experiment (&#x201c;Materials and methods&#x201d;). Using the two independent sequencing technologies, we were able to validate the rearrangements mediated by repeat 1 and repeat 2 (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>). There are also other rearrangements caused by shorter repeats (100 bp to 1 kb), but their frequency is significantly lower (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S2</bold>
</xref>). In fact, 95% of mitochondrial reads mapped against either MC1 or MC2<sup>2</sup> fully and linearly in both the HiFi and ONT sequencing datasets, and the rest of the mitochondrial reads are mainly related to the minor rearrangements (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S3</bold>
</xref>). The HiFi sequencing data and further validation by ONT altogether support four major isomeric forms, including the single circle model (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>).</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Rates of the rearrangement mediated by repeat pairs.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Repeat pair</th>
<th valign="middle" align="center">Repeat length</th>
<th valign="middle" align="center">%reference</th>
<th valign="middle" align="center">%alternative</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">Repeat-1a_b (IR)</td>
<td valign="middle" align="center">8,989</td>
<td valign="middle" align="center">50.98 (104)</td>
<td valign="middle" align="center">49.02 (100)</td>
</tr>
<tr>
<td valign="middle" align="center">Repeat-2a_b (DR)</td>
<td valign="middle" align="center">1,467</td>
<td valign="middle" align="center">22.11 (174)</td>
<td valign="middle" align="center">77.89 (613)</td>
</tr>
<tr>
<td valign="middle" align="center">Repeat-3a_b (IR)</td>
<td valign="middle" align="center">564</td>
<td valign="middle" align="center">97.74 (822)</td>
<td valign="middle" align="center">2.26 (19)</td>
</tr>
<tr>
<td valign="middle" align="center">Repeat-4a_b (IR)</td>
<td valign="middle" align="center">317</td>
<td valign="middle" align="center">98.56 (1095)</td>
<td valign="middle" align="center">1.44 (16)</td>
</tr>
<tr>
<td valign="middle" align="center">Repeat-5a_c (IR)</td>
<td valign="middle" align="center">188</td>
<td valign="middle" align="center">98.57 (553)</td>
<td valign="middle" align="center">1.43 (8)</td>
</tr>
<tr>
<td valign="middle" align="center">Repeat-5b_c (IR)</td>
<td valign="middle" align="center">188</td>
<td valign="middle" align="center">99.16 (589)</td>
<td valign="middle" align="center">0.84 (5)</td>
</tr>
<tr>
<td valign="middle" align="center">Repeat-6a_b (DR)</td>
<td valign="middle" align="center">161</td>
<td valign="middle" align="center">99.53 (1055)</td>
<td valign="middle" align="center">0.47 (5)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Rates were estimated by read mapping. IR and DR stand for inverted repeat and direct repeat, respectively. Numbers in parenthesis in the rate columns indicate the number of supporting reads.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>
<bold>(A)</bold> Proposed major isomeric forms rearranged by the two large repeats, each greater than 1,000 bp. The large repeats are indicated by black arrows on circles, while the colored arcs represent regions separated by these repeats. The labels adjacent to the arrows on the circles correspond to the repeat names listed in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref> and are abbreviated as R-1 and R-2. <bold>(B)</bold> Uniform coverage (cov.) for both ONT and HiFi reads mapped to the assembly (MC1) as visualized by IGV (top). The coverage is slightly lower in the large repeat regions due to the rearrangements mediated by those repeats. These rearrangements are validated by the existence of both ONT and HiFi reads mapped fully only against the rearranged forms (middle and bottom) and not the reference form (top).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1339594-g003.tif"/>
</fig>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Minor rearrangements hinder <italic>de novo</italic> assembly by haplotype-aware methods</title>
<p>Since the contigs computed by hifiasm only partially matched the major isomeric sequences, we investigated the multiple contigs generated by hifiasm to understand the technical challenges for plant mitogenome assembly. The size of repeat-5 is 188 bp in length, and it is a part of another larger repeat-2 that has a length of 1,467 bp (188 bp of 1,173-th to 1,360-th positions of repeat-2). Repeat-2 is related to one of the major rearrangements (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>), and repeat-5 is detected by a 188-bp long sequence far away from the repeat-2 sequences (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref>). Rearrangements explained by those small and nested repeat pairs appear to be important despite the low frequency (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>). Those minor isomeric sequences aligned well to the unique sequences found in the contigs computed by hifiasm, a haplotype-aware assembler (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S2</bold>
</xref>). A haplotype-aware assembler such as hifiasm would have concatenated major and minor isomeric forms together as single haplotypes (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref>), and this seems to be the cause of multiple contigs.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Schematic diagram showing the effects of minor rearrangements mediated by smaller repeat pairs. <bold>(A)</bold> Hypothesized products of major and minor isomeric forms mediated by large (&gt;1,000 bp) repeats-1 and repeat-2, small (&lt; 1,000 bp) repeat-3, and a small and nested repeat-5. The black arrows on circles indicate the repeats, and the colored arcs represent regions separated by the repeats. The labels near the arrows on circles show the repeat names in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref>. Repeat-1, repeat-2, repeat-3, and repeat-5 are abbreviated as R-1, R-2, R-3, and R-5 in the figure, respectively. Only relevant forms were extracted, and the full diagram is available as <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure S2</bold>
</xref>. <bold>(B)</bold> Longest contig (688,965 bp in length) generated by hifiasm which consists of sequences that aligned to hypothesized major isomeric form (MC1) and sequences which do not (MC2<sup>5ac</sup>, MC2<sup>3</sup>, and MC2<sup>2</sup>/MC1<sup>2</sup>). The hypothesized isomeric forms aligned are shown along a schematic line showing the contig. The arrows and colored lines represent repeats and regions separated by the repeats, respectively.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1339594-g004.tif"/>
</fig>
</sec>
<sec id="s3_5">
<label>3.5</label>
<title>Large inversion and fragments for the lost copy of <italic>18S rRNA</italic> in <italic>E. grandis</italic> mitogenome</title>
<p>A comparative analysis was performed on the mitogenomes of <italic>E. camaldulensis</italic> and <italic>E. grandis</italic> to understand how synteny is preserved between these two mitogenomes within the same genus. Overall synteny was found to remain intact except for a large inversion observed between positions 18,587 and 224,548 in the <italic>E. grandis</italic> mitogenome (corresponding to positions 19,028 and 212,830 in <italic>E. camaldulensis</italic>) (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5A</bold>
</xref>). Despite the fact that synteny is still maintained to some degree, it does not explain a major difference: the hypothetical linear and circular form for them. Due to the absence of other reported mitogenomes in the <italic>Eucalyptus</italic> genus, phylogenetic reconstruction of the ancestral form remains infeasible. However, intriguing fragments with homology to the 5&#x2032; terminal of the <italic>E. camaldulensis</italic> genome were detected at both the 5&#x2032; and 3&#x2032; terminals of the <italic>E. grandis</italic> mitogenome (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>). As indicated earlier, while the <italic>E. camaldulensis</italic> mitogenome encodes two copies of <italic>18S rRNA</italic> (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>), only one copy is retained in the <italic>E. grandis</italic> mitogenome (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>). Given that this gene is encoded within repeat-1 of the <italic>E. camaldulensis</italic> mitogenome  (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>), we can envisage that this gene could serve as a crucial marker for historical tracking without necessitating additional mitogenomes. A sequence comparison using LAST unveiled mutated and fragmented sequences of <italic>18S rRNA</italic> in the <italic>E. grandis</italic> mitogenome (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>). Notably, a fragment resembling a second half of the gene was located at the very 5&#x2032; end of the <italic>E. grandis</italic> mitogenome, and a fragment homologous to the first half of the gene was also recognized at the opposite end (3&#x2032; end) (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>). It is worth noting that the <italic>E. grandis</italic> mitogenome has unique and non-homologous flanking sequences at both terminals, which is consistent with the genome&#x2019;s proposed linear structure.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Schematic diagram of the sequence comparison between <italic>E. grandis</italic> and <italic>E. camaldulensis</italic> (MC2) mitogenomes. <bold>(A)</bold> The plot illustrates synteny and structural rearrangements. The largest IR, referred to as &#x201c;R-1&#x201d; in <xref ref-type="fig" rid="f3">
<bold>Figures&#xa0;3</bold>
</xref>, <xref ref-type="fig" rid="f4">
<bold>4</bold>
</xref>, is represented by black triangles in the <italic>E. camaldulensis</italic> mitogenome (yellow). Additionally, there are four DR pairs in the <italic>E. grandis</italic> mitogenome (blue), which are homologous to the largest IR, also represented by black triangles. The total size of the four DR sequences and the IR length are shown in parenthesis. <bold>(B)</bold> Detailed sequence comparison in both terminals of two genomes is shown. Similarity to the plastid genome in the very 3&#x2032; end of <italic>E. grandis</italic> genome means similarity to some plastid genomes in <italic>Eucalyptus</italic>, which did not include the <italic>E. grandis</italic> plastid genome. Unique sequence in the 5&#x2032; end means no significant hit in the nr database of NCBI.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1339594-g005.tif"/>
</fig>
</sec>
<sec id="s3_6">
<label>3.6</label>
<title>Strong correlations exist between structural variations in the <italic>E. grandis</italic> mitogenome and homologous regions of the <italic>E. camaldulensis</italic> repeat-1</title>
<p>We identified four repeat pairs&#x2014;DR-1 (1,148 bp), DR-2 (366 bp), DR-3 (4,210 bp), and DR-4 (206 bp)&#x2014;in <italic>E. grandis</italic> mitogenome (<xref ref-type="bibr" rid="B25">Pinard et&#xa0;al., 2019</xref>) as homologous to repeat-1, the largest IR in <italic>E. camaldulensis</italic> (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>). The combined length of these four repeat pairs is still shorter than that of repeat-1 (5,930 vs. 8,986 bp), suggesting that a split event may have occurred. On the opposite side of the <italic>E. grandis</italic> genome, a similarity to repeat-1, identified as fragmented <italic>18S rRNA</italic>, is also observed (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>). Assuming that the homologous fragments at both the 5&#x2032; and 3&#x2032; ends of this mitogenome originated from a single repeat sequence (i.e., repeat-1a), it is possible that either fragment could retain similarity to the homolog of its counterpart, termed repeat-1b. Pinard et&#xa0;al. described three structural variations, termed BP1, BP2, and BP3, with a high degree of confidence (<xref ref-type="bibr" rid="B25">Pinard et&#xa0;al., 2019</xref>). Of these variations, BP2 was associated with a rearrangement event triggered by a pair of DRs observed in the <italic>E. grandis</italic> mitogenome. However, no such associations could be made for the other two variations, BP1 and BP3. Notably, the breakpoints of BP3 coincided with two homologous regions 2 kb distant from the start of repeat-1 (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>). Furthermore, one breakpoint of BP1 overlapped with a region at the start of repeat-1b, and the other breakpoint coincided with another region homologous to the end of the <italic>E. camaldulensis</italic> mitogenome. Due to its continuous nature (represented as circular form), this end region seamlessly transitions into the start of repeat-1a in the <italic>E. camaldulensis</italic> mitogenome. These structural variants together show a strong correlation (within 250 bp) with respect to the <italic>E. camaldulensis</italic> coordinates (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>).</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Highly confident structural variations observed in the <italic>E. grandis</italic> mitogenome (blue). We extracted breakpoints for BP1 and BP3 from the original paper. If we map breakpoints for BP3 onto homologous coordinates on <italic>E. camaldulensis</italic> mitogenome (yellow), they pinpoint to a region 2 kb away from the beginning of repeat-1. Similarly, breakpoints for BP1 can be mapped to a very similar point in <italic>E. camaldulensis</italic> mitogenome, around the beginning of repeat-1.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-15-1339594-g006.tif"/>
</fig>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>In this study, we present the first and high-quality mitogenome of <italic>E. camaldulensis</italic> which completes the entire genomic assemblies of <italic>E. camaldulensis</italic>. This is also the second report of a mitogenome in the <italic>Eucalyptus</italic> genus. The fact that there are only two mitogenomes compared to the many nuclear genome assemblies from this genus indicates how challenging it is to assemble plant mitogenomes. Genomic features such as low mutation rates and abundant repeats, often involved in homologous recombination, are considered outcomes of DNA repair systems, particularly those addressing double-strand breaks (DSBs) (<xref ref-type="bibr" rid="B10">Christensen, 2013</xref>). In this context, repeat-mediated rearrangements are viewed as repair system errors. This aligns with common features observed in plant mitogenomes, especially those rearrangements facilitated by small repeat sequences. Larger repeat sequences (i.e., repeats longer than 1,000 bp) have been found to induce structural changes or isomerization in plant mitogenomes (<xref ref-type="bibr" rid="B28">Sloan et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B34">Wynn and Christensen, 2019</xref>).</p>
<p>Our results indicate that the rate of rearrangement by the largest repeat remains steady at around 50%; however, the rate for the second largest repeat is more unbalanced (<xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S2</bold>
</xref>). Based on these findings, we propose four primary isomeric forms comprising both single circle structures and multi-circular sub-genomic structures (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3A</bold>
</xref>).</p>
<p>HiFi reads, which we used in the assembly of the mitogenome, confirmed the existence of the significant rearrangements mediated by the largest and the second largest repeats (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>). In fact, even with accurate long reads, the mitogenome assembly can still be challenging in repetitive regions (<xref ref-type="bibr" rid="B7">Chen et&#xa0;al., 2021</xref>). Therefore, we manually analyzed repeat regions highlighting those reads that span the entire repeat as well as flanking sequences to rule out any potential errors introduced by repeat units on the assembly graph (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures S3, S4</bold>
</xref>).</p>
<p>Additionally, we further validated our results using an ONT sequencing dataset that was not used in the genome assembly. Overall, both HiFi and ONT reads aligned to the assembled sequences of the major isoforms, validating the assembly (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>; <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figures S3, S4</bold>
</xref>). These experiments and analyses support the existence of multiple isoforms of the genome and their respective sequences. This characteristic of plant mitogenomes has implications for phylogenetic analysis, especially among closely related species. While low mutation rates in protein coding genes and high variation in non-coding regions pose technical challenges in phylogenetic analysis, sequence alignment that considers rearrangement is helpful in overcoming these challenges.</p>
<p>A nested relationship was observed in the genome as one repeat sequence, repeat-5, is part of a larger sequence, termed repeat-2. While nested pair rearrangements appear to be infrequent, such complex repeat pairs hampered assembly by haplotype-aware methods, presumably due to the methods&#x2019; sensitivity. Haplotype-aware assemblers aim to keep one haplotype contiguous (<xref ref-type="bibr" rid="B9">Cheng et&#xa0;al., 2021</xref>), which is not always ideal for organelle genome assemblies. Indeed an approach that takes into account the characteristics of plant organelle genomes would be better suited to reconstructing major forms of plant mitochondrial genomes that may have undergone complex rearrangements with identical sequences.</p>
<p>Even if major forms could be partially detected by a conventional approach, a <italic>post-hoc</italic> analysis was still required to obtain the full picture of mitogenome dynamism. Infrequent nested pair rearrangements need complex structures, even when the repeat graph format is represented. An example of this complexity is a &#x201c;triple-fork&#x201d; structure to represent rearrangements mediated by nested repeat pairs, which is more intricate than the recently suggested &#x201c;double-fork&#x201d; structure (<xref ref-type="bibr" rid="B14">Fischer et&#xa0;al., 2022</xref>). This observation shows that more theoretical progress is needed in this field.</p>
<p>In regard to the evolution of <italic>18S</italic> and <italic>5S rRNA</italic> genes, the presence of mutated <italic>18S rRNA</italic> in the mitogenome of <italic>E. grandis</italic> supports that there was another copy of <italic>18S rRNA</italic> and the loss event of that copy. It is likely that the last common ancestor of <italic>E. grandis</italic> and <italic>E. camaldulensis</italic> possessed two copies of <italic>18S rRNA</italic> in the mitogenome. An alternative scenario would involve two independent duplications of the genes after the divergence to the ancestors of <italic>E. camaldulensis</italic> and <italic>E. grandis</italic>. However, this scenario is less likely because it assumes two duplication events of the gene into a similar physical location on each genome, i.e., next to <italic>5S rRNA</italic>. It is worth noting that the mitogenomes of <italic>S. samarangense</italic>, <italic>R. tomentosa</italic>, and <italic>B. coptidifolia</italic> are annotated to contain only one copy of <italic>18S rRNA</italic> and <italic>5S rRNA</italic>. It is likely that the duplication of a relatively long sequence containing both <italic>18S rRNA</italic> and <italic>5S rRNA</italic> genes, rather than the duplication of single genes, occurred during the divergence to the <italic>Eucalyptus</italic> genus in the <italic>Myrtaceae</italic> family, followed by the loss of <italic>18S rRNA</italic> gene in the lineage of <italic>E. grandis</italic> along with the splitting of the repeat sequence (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>).</p>
<p>If DSBs are common in the plant mitochondria, failure in DNA repair mechanisms may be inherited and maintained over evolutionary time. If DSB is a rare condition, failure in DNA repair mechanisms would have less impact; however, it is important to note that rearrangements can also lead to the development of novel biological functions. One possible example is cytoplasmic male sterility, a phenomenon in plants that prevents them from producing viable pollen and has been linked to mitochondrial genome rearrangements (<xref ref-type="bibr" rid="B23">Mower et&#xa0;al., 2012</xref>). DSBs could be the reason for the discrepancy between the mitogenomes of <italic>E. camaldulensis</italic> and <italic>E. grandis</italic>. As discussed above, the presence of a mutated and fragmented copy of <italic>18S rRNA</italic> in the mitogenome of <italic>E. grandis</italic> suggests that the last common ancestral mitogenome of both <italic>E. grandis</italic> and <italic>E, camaldulensis</italic> should have contained two copies of <italic>18S rRNA</italic> similar to the mitochondria of <italic>E. camaldulensis</italic>. Following this suggestion, a DSB event could have occurred in between a region equivalent to repeat-1a. This is also supported by the non-homologous sequences at both ends of <italic>E. grandis</italic> mitogenome (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>). The hypothetical linear form of the <italic>E. grandis</italic> genome is consistent with the flanking sequences at both 5&#x2032; and 3&#x2032; ends, which are dissimilar to those of <italic>E. camaldulensis</italic> and any other mitogenome. The 5&#x2032; flanking sequence is quite unique, and we were unable to detect any significant matches in the NCBI nucleotide database. There is instead a similarity between the 3&#x2032; flanking sequence and the chloroplast genomes of other plant species. Unfortunately, we lack data to explain the reason, and more mitogenomes and further analysis will be required in the future.</p>
<p>One interesting nature of repeat sequences is their plasticity. Any subsequences in a repeat sequence can also generate a new repeat pair if the equivalent subsequence appears in another location. This plasticity feature has been detected in our study as nested repeat sequences. Rearrangements mediated by nested repeat pairs were also observed in the longest contig computed by hifiasm. Conventional genome assemblers are not designed to resolve all variations caused by complex repeats (<xref ref-type="bibr" rid="B14">Fischer et&#xa0;al., 2022</xref>). Multiple algorithms should be applied to complete both nuclear and organelle genome assemblies, at least in plant genome projects.</p>
<p>The other feature of repeat plasticity is high separability. If a repeat sequence of a pair is cut <italic>n</italic> times, <italic>n+1</italic> subsequences should keep similarity to the counterparts in the other sequence of the pair. This could lead to new <italic>n+1</italic> pairs of repeat sequences in the following generations if inherited. Although it was not obvious in the primary structure of the <italic>E. grandis</italic> mitogenome, two high-confidence structural variations seem to be two recent pairs of repeats generated by a single DSB event (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>). Even breakage of a repeat would not have lost its repeat characteristic.</p>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusion</title>
<p>In this study, we presented the first and high-quality mitogenome of <italic>E. camaldulensis</italic>. Although the mitogenome is much smaller than the nuclear genome, its nature in plant species could hinder genome assembly. Rearrangements mediated by dispersed repeat can lead to fragmentation in the assembly graph, having resulted in a lower number of available sequences than the nuclear assembly. A comparison of the mitogenomes of <italic>E. camaldulensis</italic> and <italic>E. grandis</italic> revealed a unique alteration of the repeat sequences at the evolutionary scale. Repeat sequences exhibit a high level of plasticity, which may contribute to the diversity and evolution of plant mitochondria. The presented mitogenome will serve as a reference for further analyses of other eucalypts.</p>
</sec>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The complete mitogenome sequence of <italic>E. camaldulensis</italic> has been submitted to GenBank with the accession number OR763353. The ONT sequencing data utilized for the assembly validation is available under NCBI BioProject ID PRJNA737587. </p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>YF: Writing &#x2013; original draft, Visualization, Funding acquisition, Formal Analysis, Conceptualization. PD: Writing &#x2013; review &amp; editing, Resources, Investigation. SB: Validation, Writing &#x2013; review &amp; editing, Data curation. KC: Writing &#x2013; review &amp; editing, Investigation, Data curation. AP: Writing &#x2013; review &amp; editing, Investigation, Data curation. M-SC: Writing &#x2013; review &amp; editing, Visualization, Resources. LE: Writing &#x2013; original draft, Formal Analysis, Conceptualization.</p>
</sec>
</body>
<back>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. The study was partly supported by the startup funding from Utsunomiya University (<ext-link ext-link-type="uri" xlink:href="https://www.utsunomiya-u.ac.jp/en/">https://www.utsunomiya-u.ac.jp/en/</ext-link>) and JSPS KAKENHI Grant Number 23K19338 to YF.</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>We thank the KAUST Bioscience Core Labs for providing technical support for the data generation. Computations in this study were partially performed on the NIG supercomputer at ROIS National Institute of Genetics.</p>
</ack>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors&#xa0;and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2024.1339594/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2024.1339594/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Adams</surname> <given-names>K. L.</given-names>
</name>
<name>
<surname>Qiu</surname> <given-names>Y.-L.</given-names>
</name>
<name>
<surname>Stoutemyer</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Palmer</surname> <given-names>J. D.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Punctuated evolution of mitochondrial gene content: high and variable rates of mitochondrial gene loss and transfer to the nucleus during angiosperm evolution</article-title>. <source>Proc. Natl. Acad. Sci. United States America</source> <volume>99</volume>, <fpage>9905</fpage>&#x2013;<lpage>9125</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.042694899</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Altschul</surname> <given-names>S. F.</given-names>
</name>
<name>
<surname>Madden</surname> <given-names>T. L.</given-names>
</name>
<name>
<surname>Sch&#xe4;ffer</surname> <given-names>A. A.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Miller</surname> <given-names>W.</given-names>
</name>
<etal/>
</person-group>. (<year>1997</year>). <article-title>Gapped BLAST and PSI-BLAST: A new generation of protein database search programs</article-title>. <source>Nucleic Acids Res.</source> <volume>25</volume>, <fpage>3389</fpage>&#x2013;<lpage>3402</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/25.17.3389</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alverson</surname> <given-names>A. J.</given-names>
</name>
<name>
<surname>Wei</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Rice</surname> <given-names>D. W.</given-names>
</name>
<name>
<surname>Stern</surname> <given-names>D. B.</given-names>
</name>
<name>
<surname>Barry</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Palmer</surname> <given-names>J. D.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Insights into the evolution of mitochondrial genome size from complete sequences of citrullus lanatus and cucurbita pepo (Cucurbitaceae)</article-title>. <source>Mol. Biol. Evol.</source> <volume>27</volume>, <fpage>1436</fpage>&#x2013;<lpage>1485</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msq029</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Arrieta-Montiel</surname> <given-names>M. P.</given-names>
</name>
<name>
<surname>Shedge</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Davila</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Christensen</surname> <given-names>A. C.</given-names>
</name>
<name>
<surname>Mackenzie</surname> <given-names>S. A.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Diversity of the arabidopsis mitochondrial genome occurs via Nuclear-Controlled Recombination Activity</article-title>. <source>Genet.</source> <volume>183</volume>, <fpage>1261</fpage>&#x2013;<lpage>1685</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1534/genetics.109.108514</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Butcher</surname> <given-names>P. A.</given-names>
</name>
<name>
<surname>Otero</surname> <given-names>A.</given-names>
</name>
<name>
<surname>McDonald</surname> <given-names>M. W.</given-names>
</name>
<name>
<surname>Moran</surname> <given-names>G. F.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Nuclear RFLP variation in eucalyptus camaldulensis dehnh. from Northern Australia</article-title>. <source>Heredity</source> <volume>88</volume>, <fpage>402</fpage>&#x2013;<lpage>412</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/sj.hdy.6800074</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chan</surname> <given-names>P. P.</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>B. Y.</given-names>
</name>
<name>
<surname>Mak</surname> <given-names>A. J.</given-names>
</name>
<name>
<surname>Lowe</surname> <given-names>T. M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>TRNAscan-SE 2.0: improved detection and functional classification of transfer RNA genes</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>9077</fpage>&#x2013;<lpage>9965</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkab688</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>A. Y.</given-names>
</name>
<name>
<surname>Gao</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Chong</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Accurate long-read de novo assembly evaluation with inspector</article-title>. <source>Genome Biol.</source> <volume>22</volume>, <fpage>3125</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13059-021-02527-4</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Grover</surname> <given-names>C. E.</given-names>
</name>
<name>
<surname>Nie</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Wendel</surname> <given-names>J. F.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Plant mitochondrial genome evolution and cytoplasmic male sterility</article-title>. <source>Crit. Rev. Plant Sci.</source> <volume>36</volume>, <fpage>55</fpage>&#x2013;<lpage>695</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/07352689.2017.1327762</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cheng</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Concepcion</surname> <given-names>G. T.</given-names>
</name>
<name>
<surname>Feng</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Haplotype-resolved de novo assembly using phased assembly graphs with hifiasm</article-title>. <source>Nat. Methods</source> <volume>18</volume>, <fpage>170</fpage>&#x2013;<lpage>755</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41592-020-01056-5</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Christensen</surname> <given-names>A. C.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Plant mitochondrial genome evolution can be explained by DNA repair mechanisms</article-title>. <source>Genome Biol. Evol.</source> <volume>5</volume>, <fpage>1079</fpage>&#x2013;<lpage>1086</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gbe/evt069</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cole</surname> <given-names>L. W.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Mower</surname> <given-names>J. P.</given-names>
</name>
<name>
<surname>Palmer</surname> <given-names>J. D.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>High and variable rates of repeat-mediated mitochondrial genome rearrangement in a genus of plants</article-title>. <source>Mol. Biol. Evol.</source> <volume>35</volume>, <fpage>2773</fpage>&#x2013;<lpage>2855</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msy176</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Darling</surname> <given-names>A. E.</given-names>
</name>
<name>
<surname>Mau</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Perna</surname> <given-names>N. T.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>ProgressiveMauve: multiple genome alignment with gene gain, loss and rearrangement</article-title>. <source>PloS One</source> <volume>5</volume>, <elocation-id>e111475</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0011147</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Driguez</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Bougouffa</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Carty</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Putra</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Jabbari</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Reddy</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>LeafGo: leaf to genome, a quick workflow to produce high-quality de novo plant genomes using long-read sequencing technology</article-title>. <source>Genome Biol.</source> <volume>22</volume>, <fpage>2565</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13059-021-02475-z</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fischer</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Dotzek</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Walther</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Greiner</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Graph-based models of the oenothera mitochondrial genome capture the enormous complexity of higher plant mitochondrial DNA organization</article-title>. <source>NAR Genomics Bioinf.</source> <volume>4</volume>, <fpage>lqac027</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nargab/lqac027</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fukasawa</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Tsuji</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Fu</surname> <given-names>S. C.</given-names>
</name>
<name>
<surname>Tomii</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Horton</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>MitoFates: improved prediction of mitochondrial targeting sequences and their cleavage sites</article-title>. <source>Mol. Cell. Proteomics</source>. <volume>14</volume>, <fpage>1113</fpage>&#x2013;<lpage>1126</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1074/mcp.M114.043083</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goel</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Jiao</surname> <given-names>W.-B.</given-names>
</name>
<name>
<surname>Schneeberger</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>SyRI: finding genomic rearrangements and local sequence differences from whole-genome assemblies</article-title>. <source>Genome Biol.</source> <volume>20</volume>, <fpage>2775</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13059-019-1911-0</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Greiner</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Lehwark</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Bock</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>OrganellarGenomeDRAW (OGDRAW) version 1.3.1: expanded toolkit for the graphical visualization of organellar genomes</article-title>. <source>Nucleic Acids Res.</source> <volume>47</volume>, <fpage>W59</fpage>&#x2013;<lpage>W64</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkz238</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kie&#x142;basa</surname> <given-names>S. M.</given-names>
</name>
<name>
<surname>Wan</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Sato</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Horton</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Frith</surname> <given-names>M. C.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Adaptive seeds tame genomic sequence comparison</article-title>. <source>Genome Res.</source> <volume>21</volume>, <fpage>487</fpage>&#x2013;<lpage>935</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.113985.110</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kolmogorov</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>Yu</given-names>
</name>
<name>
<surname>Pevzner</surname> <given-names>P. A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Assembly of long, error-prone reads using repeat graphs</article-title>. <source>Nat. Biotechnol.</source> <volume>37</volume>, <fpage>540</fpage>&#x2013;<lpage>465</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41587-019-0072-8</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Minimap2: pairwise alignment for nucleotide sequences</article-title>. <source>Bioinformatics</source> <volume>34</volume>, <fpage>3094</fpage>&#x2013;<lpage>3100</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bty191</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>L&#xf6;tter</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Duong</surname> <given-names>T. A.</given-names>
</name>
<name>
<surname>Candotti</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Mizrachi</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Wegrzyn</surname> <given-names>J. L.</given-names>
</name>
<name>
<surname>Myburg</surname> <given-names>A. A.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Haplogenome assembly reveals structural variation in eucalyptus interspecific hybrids</article-title>. <source>GigaScience</source> <volume>12</volume>, <fpage>giad064</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gigascience/giad064</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lu</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Q.</given-names>
</name>
</person-group> (<year>2024</year>). <article-title>Complete mitochondrial genome of syzygium samarangense reveals genomic recombination, gene transfer, and RNA editing events</article-title>. <source>Front. Plant Sci.</source> <volume>14</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2023.1301164</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mower</surname> <given-names>J. P.</given-names>
</name>
<name>
<surname>Case</surname> <given-names>A. L.</given-names>
</name>
<name>
<surname>Floro</surname> <given-names>E. R.</given-names>
</name>
<name>
<surname>Willis</surname> <given-names>J. H.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Evidence against equimolarity of large repeat arrangements and a predominant master circle structure of the mitochondrial genome from a monkeyflower (Mimulus guttatus) lineage with cryptic CMS</article-title>. <source>Genome Biol. Evol.</source> <volume>4</volume>, <fpage>670</fpage>&#x2013;<lpage>865</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gbe/evs042</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Myburg</surname> <given-names>A. A.</given-names>
</name>
<name>
<surname>Grattapaglia</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Tuskan</surname> <given-names>G. A.</given-names>
</name>
<name>
<surname>Hellsten</surname> <given-names>U.</given-names>
</name>
<name>
<surname>Hayes</surname> <given-names>R. D.</given-names>
</name>
<name>
<surname>Grimwood</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2014</year>). <article-title>The genome of eucalyptus grandis</article-title>. <source>Nature</source> <volume>510</volume>, <fpage>356</fpage>&#x2013;<lpage>362</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature13308</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pinard</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Myburg</surname> <given-names>A. A.</given-names>
</name>
<name>
<surname>Mizrachi</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>The plastid and mitochondrial genomes of eucalyptus grandis</article-title>. <source>BMC Genomics</source> <volume>20</volume>, <fpage>1325</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12864-019-5444-4</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Siculella</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Damiano</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Cortese</surname> <given-names>M. R.</given-names>
</name>
<name>
<surname>Dassisti</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Rainaldi</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Gallerani</surname> <given-names>R.</given-names>
</name>
<etal/>
</person-group>. (<year>2001</year>). <article-title>Gene content and organization of the oat mitochondrial genome</article-title>. <source>TAG. Theor. Appl. Genet. Theoretische Und Angewandte Genetik</source> <volume>103</volume>, <fpage>359</fpage>&#x2013;<lpage>365</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s001220100568</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sloan</surname> <given-names>D. B.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>One ring to rule them all? Genome sequencing provides new insights into the &#x2018;master circle&#x2019; Model of plant mitochondrial DNA structure</article-title>. <source>New Phytol.</source> <volume>200</volume>, <fpage>978</fpage>&#x2013;<lpage>985</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/nph.12395</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sloan</surname> <given-names>D. B.</given-names>
</name>
<name>
<surname>Alverson</surname> <given-names>A. J.</given-names>
</name>
<name>
<surname>Storchov&#xe1;</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Palmer</surname> <given-names>J. D.</given-names>
</name>
<name>
<surname>Taylor</surname> <given-names>D. R.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Extensive loss of translational genes in the structurally dynamic mitochondrial genome of the angiosperm silene latifolia</article-title>. <source>BMC Evol. Biol.</source> <volume>274</volume>, <fpage>1</fpage>&#x2013;<lpage>15</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2148-10-274</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Rearrangement and domestication as drivers of rosaceae mitogenome plasticity</article-title>. <source>BMC Biol.</source> <volume>20</volume>, <fpage>1815</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12915-022-01383-3</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tamura</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Stecher</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Kumar</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>MEGA11: molecular evolutionary genetics analysis version 11</article-title>. <source>Mol. Biol. Evol.</source> <volume>38</volume>, <fpage>3022</fpage>&#x2013;<lpage>3275</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msab120</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Das</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Kainer</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Schalamun</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Morales-Suarez</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Schwessinger</surname> <given-names>B.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>The draft nuclear genome assembly of eucalyptus pauciflora: A pipeline for comparing de novo assemblies</article-title>. <source>GigaScience</source> <volume>9</volume>, <fpage>giz160</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gigascience/giz160</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Lanfear</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Long-reads reveal that the chloroplast genome exists in two distinct versions in most plants</article-title>. <source>Genome Biol. Evol.</source> <volume>11</volume>, <fpage>3372</fpage>&#x2013;<lpage>3815</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gbe/evz256</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Waneka</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Broz</surname> <given-names>A. K.</given-names>
</name>
<name>
<surname>King</surname> <given-names>C. R.</given-names>
</name>
<name>
<surname>Sloan</surname> <given-names>D. B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>MSH1 is required for maintenance of the low mutation rates in plant mitochondrial and plastid genomes</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>117</volume>, <fpage>16448</fpage>&#x2013;<lpage>16555</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.2001998117</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wynn</surname> <given-names>E. L.</given-names>
</name>
<name>
<surname>Christensen</surname> <given-names>A. C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Repeats of unusual size in plant mitochondrial genomes: identification, incidence and evolution</article-title>. <source>G3: Genes Genom. Genet.</source> <volume>9</volume>, <fpage>549</fpage>&#x2013;<lpage>595</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1534/g3.118.200948</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>