<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3-mathml3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="1.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title-group>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
</journal-title-group>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2026.1736783</article-id>
<article-version article-version-type="Version of Record" vocab="NISO-RP-8-2008"/>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Original Research</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Plastid genome variation in the green algal genus <italic>Coelastrum</italic> (Scenedesmaceae)</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Lee</surname><given-names>Chanhee</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>*</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3252230/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="visualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Jansen</surname><given-names>Robert K.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/486483/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
</contrib>
<contrib contrib-type="author">
<name><surname>Theriot</surname><given-names>Edward C.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/3301308/overview"/>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Project administration" vocab-term-identifier="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing &#x2013; review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing &#x2013; review &amp; editing</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
</contrib>
</contrib-group>
<aff id="aff1"><label>1</label><institution>Plant Biology Graduate Program, University of Texas at Austin</institution>, <city>Austin</city>, <state>TX</state>,&#xa0;<country country="us">United States</country></aff>
<aff id="aff2"><label>2</label><institution>Department of Integrative Biology, University of Texas at Austin</institution>, <city>Austin</city>, <state>TX</state>,&#xa0;<country country="us">United States</country></aff>
<author-notes>
<corresp id="c001"><label>*</label>Correspondence: Chanhee Lee, <email xlink:href="mailto:chanhee.lee@utexas.edu">chanhee.lee@utexas.edu</email></corresp>
</author-notes>
<pub-date publication-format="electronic" date-type="pub" iso-8601-date="2026-02-09">
<day>09</day>
<month>02</month>
<year>2026</year>
</pub-date>
<pub-date publication-format="electronic" date-type="collection">
<year>2026</year>
</pub-date>
<volume>17</volume>
<elocation-id>1736783</elocation-id>
<history>
<date date-type="received">
<day>31</day>
<month>10</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>16</day>
<month>01</month>
<year>2026</year>
</date>
<date date-type="rev-recd">
<day>13</day>
<month>01</month>
<year>2026</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2026 Lee, Jansen and Theriot.</copyright-statement>
<copyright-year>2026</copyright-year>
<copyright-holder>Lee, Jansen and Theriot</copyright-holder>
<license>
<ali:license_ref start_date="2026-02-09">https://creativecommons.org/licenses/by/4.0/</ali:license_ref>
<license-p>This is an open-access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution License (CC BY)</ext-link>. The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</license-p>
</license>
</permissions>
<abstract>
<p>Plastid genomes (plastomes) in green algae display remarkable variation in size and structure, yet comprehensive species and strain-level analyses remain rare. Here, we present a detailed plastome comparison across 29 strains of nine nominal species of the genus <italic>Coelastrum</italic> (Scenedesmaceae). Sizes ranged from 166,827 bp to 553,457 bp, the latter representing the largest plastome reported to date in the order Sphaeropleales. An almost twofold size difference was observed between strains of the same species, <italic>Coelastrum morus</italic>, highlighting unprecedented intraspecific plastome expansion in closely related green algae. Comparative analyses revealed that plastome size variation is primarily driven by the expansion of non-coding regions and repeat accumulation, with additional contributions from inverted repeat (IR) length and intron content. Phylogenomic inference based on shared protein-coding genes recovered well-supported clades and resolved species-level relationships, offering improved taxonomic resolution relative to previous single-gene analyses (nuclear ITS, nuclear SSU, <italic>tufA</italic>), which provided different relationships among critical taxa in <italic>Coelastrum</italic> and <italic>Hariotina</italic>. However, uneven taxon and strain sampling among molecular phylogenetic studies of <italic>Coelastrum</italic> and closely related Scenedesmaceae, including ours, is possibly as much of an obstacle to resolution of incongruences as is gene sampling. While gene content was largely conserved, we documented several lineage-specific gene and tRNA losses and unique intron insertions, reflecting dynamic structural evolution. Our results provide new insights into plastome architecture, intron evolution, and species boundaries within <italic>Coelastrum</italic>, and demonstrate the value of dense taxon and strain sampling for understanding plastid genome evolution in Chlorophyta.</p>
</abstract>
<kwd-group>
<kwd><italic>Coelastrum</italic></kwd>
<kwd>intron distribution</kwd>
<kwd>phylogenomics</kwd>
<kwd>plastome evolution</kwd>
<kwd>plastome size variation</kwd>
<kwd>repetitive DNA</kwd>
</kwd-group>
<funding-group>
<funding-statement>The author(s) declared that financial support was received for this work and/or its publication. This work was supported by the Harold C. and Mary D. Bold Professorship in Cryptogamic Botany (Phycology); the U.S. National Science Foundation (NSF) grant 1754614; and the Texas Ecological Laboratory Program.</funding-statement>
</funding-group>
<counts>
<fig-count count="4"/>
<table-count count="2"/>
<equation-count count="0"/>
<ref-count count="63"/>
<page-count count="16"/>
<word-count count="9230"/>
</counts>
<custom-meta-group>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Aquatic Photosynthetic Organisms</meta-value>
</custom-meta>
</custom-meta-group>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>The plastid genome (plastome) of green algae typically exhibits a conserved quadripartite structure, consisting of two copies of an inverted repeat (IR) that encode the ribosomal RNA (rRNA) operon, separated by small single-copy (SSC) and large single-copy (LSC) regions (<xref ref-type="bibr" rid="B31">Lang and Nedelcu, 2012</xref>; <xref ref-type="bibr" rid="B39">Mower and Vickrey, 2018</xref>). Although this organization is shared with most land plants, plastome size and structure in green algae are notably more variable, ranging from as small as 64 kb to over 520 kb, compared to the 120&#x2013;160 kb range in most photosynthetic seed plants (<xref ref-type="bibr" rid="B59">Wicke et&#xa0;al., 2011</xref>; <xref ref-type="bibr" rid="B24">Jansen and Ruhlman, 2012</xref>). For example, the plastome of <italic>Prasinophyceae</italic> sp. is only 64 kb in length with highly contracted intergenic regions comprising 10% of the genome (<xref ref-type="bibr" rid="B34">Lemieux et&#xa0;al., 2014</xref>). In contrast, <italic>Haematococcus lacustris</italic> and <italic>H. pluvialis</italic> have the largest green algal genomes discovered to date at over 1.35 Mb (<xref ref-type="bibr" rid="B3">Bauman et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B43">Ren et&#xa0;al., 2021</xref>). The primary contributors to large genome size in these and other green algae with plastomes over 500 kb, such as <italic>Floydiella terrestris</italic> and <italic>Volvox carteri</italic>, are large non-coding intergenic regions, which can account for up to 80% of their total genome size (<xref ref-type="bibr" rid="B7">Brouard et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B49">Smith and Lee, 2010</xref>; <xref ref-type="bibr" rid="B46">Smith, 2018</xref>; <xref ref-type="bibr" rid="B43">Ren et&#xa0;al., 2021</xref>).</p>
<p>Inverted repeat regions are evolutionarily dynamic across higher-level taxonomic categories in the Chlorophyta. There are examples of expansion or contraction in families as diverse as Chlorellaceae, Pedinomonadaceae, Prasiolaceae, and Trebouxiaceae (<xref ref-type="bibr" rid="B55">Turmel et&#xa0;al., 2017</xref>). More rarely, independent losses have been reported for <italic>F. terrestris</italic> (Chlorophyceae), <italic>Stigeoclonium helveticum</italic> (Chlorophyceae), <italic>Bryopsis plumosa</italic> (Ulvophyceae), and several Trebouxiophyceae species (<xref ref-type="bibr" rid="B4">B&#xe9;langer et&#xa0;al., 2006</xref>; <xref ref-type="bibr" rid="B7">Brouard et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B54">Turmel et&#xa0;al., 2015</xref>, <xref ref-type="bibr" rid="B51">2016</xref>). Despite these insights, comprehensive studies of plastome evolution at the intraspecific or intrageneric level remain rare, limiting our understanding of structural diversity at lower taxonomic levels.</p>
<p>Plastome size variation in green algae is driven by several evolutionary factors, including differences in intron content, intergenic region size, IR variation, repeats, and gene loss. Intron distribution has been documented across major chlorophyte classes, including Trebouxiophyceae, Ulvophyceae, and Chlorophyceae (<xref ref-type="bibr" rid="B11">de Cambiaire et&#xa0;al., 2006</xref>, <xref ref-type="bibr" rid="B12">2007</xref>; <xref ref-type="bibr" rid="B36">McManus et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B53">Turmel and Lemieux, 2018</xref>; <xref ref-type="bibr" rid="B58">Wang et&#xa0;al., 2019</xref>, <xref ref-type="bibr" rid="B57">2024</xref>; <xref ref-type="bibr" rid="B61">Zhao et&#xa0;al., 2022</xref>). These studies span multiple plastid genes, such as <italic>atpB</italic>, <italic>psaA</italic>, <italic>psaB</italic>, <italic>psbC</italic>, <italic>psbD</italic>, and <italic>rbcL</italic>. The number, size, and lineage-specific presence of these introns have been shown to contribute significantly to plastome size and complexity (<xref ref-type="bibr" rid="B40">Mu&#xf1;oz-G&#xf3;mez et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B36">McManus et&#xa0;al., 2018</xref>). Additionally, gene loss has been a pervasive force shaping plastome architecture in green algae. The ancestral green algal plastome is estimated to have encoded approximately 141 genes (<xref ref-type="bibr" rid="B53">Turmel and Lemieux, 2018</xref>) but substantial gene loss occurred across major lineages such as Prasinophytes and core Chlorophytes, including <italic>Coelastrum</italic>. 
Many of these losses have been attributed to gene transfers from the plastome to the nuclear genome (<xref ref-type="bibr" rid="B50">Stegemann et&#xa0;al., 2003</xref>; <xref ref-type="bibr" rid="B41">Palenik et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B44">Robbens et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B52">Turmel et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B53">Turmel and Lemieux, 2018</xref>). In Sphaeropleales, multiple genes involved in photosynthesis, plastid maintenance, and gene expression have been lost, reflecting a dynamic pattern of genome streamlining and functional reorganization (<xref ref-type="bibr" rid="B18">Fu&#x10d;&#xed;kov&#xe1; et&#xa0;al., 2016</xref>).</p>
<p>Despite growing interest in plastome phylogenomics within green algae, detailed investigations of intron variation and gene loss at the species level remain limited, particularly within genera that include multiple closely related taxa. Most comparative analyses have focused on broad phylogenetic scales, leaving gaps in our understanding of how plastome evolution operates within specific clades (<xref ref-type="bibr" rid="B34">Lemieux et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B54">Turmel et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B18">Fu&#x10d;&#xed;kov&#xe1; et&#xa0;al., 2016</xref>).</p>
<p>The genus <italic>Coelastrum</italic> (family Scenedesmaceae, order Sphaeropleales) represents an ideal group for addressing these gaps. Though <italic>Coelastrum</italic> is cosmopolitan and ecologically important, its organellar genome evolution remains largely unexplored. A molecular phylogenetic analysis by <xref ref-type="bibr" rid="B22">Hegewald et&#xa0;al. (2010)</xref> based on nuclear 18S ribosomal DNA (rDNA) and internal transcribed spacer 2 (ITS2) secondary structure suggested that <italic>Coelastrum</italic> may be non-monophyletic, with weakly supported interspecific relationships and several sister species relationships unresolved. In contrast, plastid genes such as <italic>rbcL</italic> and <italic>tufA</italic> have shown stronger phylogenetic signal in Scenedesmaceae and other chlorophytes (<xref ref-type="bibr" rid="B45">Sciuto et&#xa0;al., 2015</xref>), highlighting the need for plastome-level data to clarify relationships.</p>
<p>To date, only 19 complete plastomes have been published from the Scenedesmaceae (<xref ref-type="bibr" rid="B11">de Cambiaire et&#xa0;al., 2006</xref>; <xref ref-type="bibr" rid="B58">Wang et&#xa0;al., 2019</xref>, <xref ref-type="bibr" rid="B57">2024</xref>, <xref ref-type="bibr" rid="B56">2025</xref>; <xref ref-type="bibr" rid="B14">Douchi et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B61">Zhao et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B9">Cho and Lee, 2024</xref>; <xref ref-type="bibr" rid="B60">Xu et&#xa0;al., 2024</xref>), of which only one was a <italic>Coelastrum</italic> (<xref ref-type="bibr" rid="B32">Lee et&#xa0;al., 2023</xref>). In this paper, we added 28 newly sequenced plastomes from different strains of <italic>Coelastrum</italic>, for a total of 29 <italic>Coelastrum</italic> strains, spanning 9 nominal species, and compared them to 18 outgroup strains representing 18 species or subspecific taxa in 8 genera. We examined variation in genome size, IR boundaries, intron content, repeat elements, and gene loss to provide an in-depth genomic perspective on organellar evolution within <italic>Coelastrum</italic>.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Taxon sampling and DNA extraction</title>
<p>We reconstructed the plastome of 28 strains of <italic>Coelastrum</italic>. We isolated 11 new strains of <italic>Coelastrum</italic> from Gull Lake (3 strains), Swan Lake (4 strains), and Wintergreen Lake (2 strains) in Michigan, Coral Gables Canal in Florida (1 strain), and Lake Buchanan (1 strain) in Texas, all collected using a 20 &#x3bc;m mesh plankton net. The isolated strains were cultured and maintained in WC (Wright Chu) artificial freshwater media (<xref ref-type="bibr" rid="B19">Guillard, 1975</xref>). Another eight strains were obtained from the UTEX Culture Collection, and ten strains were acquired from the Experimental Phycology and Culture Collection of Algae (EPSAG). Additionally, one <italic>Coelastrum</italic> plastome and 18 Scenedesmaceae outgroup plastomes were downloaded from NCBI (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/">http://www.ncbi.nlm.nih.gov/</ext-link>) for phylogenetic analysis: <italic>Coelastrum microporum</italic> (NC068582), <italic>Asterarcys</italic> sp. (MK995333), <italic>Coccoidesmus tetrasporum</italic> (OR350844), <italic>Coelastrella saipanensis</italic> (NC042181), <italic>Coronastrum ellipsoideum</italic> (PP979513), <italic>Crucigenia lauterbornii</italic> (PP979532), <italic>Crucigenia quadrata</italic> (PQ301446), <italic>Desmodesmus abundans</italic> (NC066651), <italic>Desmodesmus spinosus</italic> (PV295633), <italic>Pectinodesmus pectinatus</italic> (NC036668), <italic>Tetradesmus arenicola</italic> (NC086756), <italic>Tetradesmus bajacalifornicus</italic> (NC086755), <italic>Tetradesmus dimorphus</italic> (NC086754), <italic>Tetradesmus distendus</italic> (NC086753), <italic>Tetradesmus lancea</italic> (OR502671), <italic>Tetradesmus major</italic> f. <italic>lunatus</italic> (OR502665), <italic>Tetradesmus obliquus</italic> (NC008101), <italic>Tetradesmus obliquus</italic> var. <italic>spiraliformis</italic> (OR502672), and <italic>Tetradesmus reginae</italic> (NC086752).</p>
<p>All <italic>Coelastrum</italic> strains grown in our laboratory were observed under a light microscope for initial species identification based on morphological criteria, while cells were in exponential growth phase in WC media. Increases in cell abundance were determined by daily fluorescence in 25&#xa0;mm diameter glass tubes in a Turner TD-700<sup>&#xae;</sup> fluorometer. Scanning electron microscopy (SEM) was then utilized to evaluate ultrastructural variation in cell walls among species. Strains were fixed with formaldehyde or glutaraldehyde and dehydrated on a 25&#xa0;mm diameter, 0.2 &#x3bc;m pore size membrane filter. Critical-point dried samples were mounted onto aluminum SEM stubs and coated with iridium using a sputter coater. Cell shape and ultrastructure were examined to confirm identity at the species level based on authoritative references (<xref ref-type="bibr" rid="B16">Fenwick et&#xa0;al., 1966</xref>; <xref ref-type="bibr" rid="B15">Fenwick, 1968</xref>; <xref ref-type="bibr" rid="B29">Kom&#xe1;rek and Fott, 1983</xref>; <xref ref-type="bibr" rid="B22">Hegewald et&#xa0;al., 2010</xref>).</p>
<p>Our identification of publicly available strains matched the names associated with those deposits and the literature. Our identification of our new strains was based upon agreement with the literature and with the morphology of the publicly available strains. We use the term &#x201c;nominal species&#x201d; to emphasize that any classification at any time is a hypothesis.</p>
<p>To obtain DNA, cultures grown in WC medium were harvested in exponential phase, and cells were pelleted by centrifugation at 4,500 rpm for 20&#xa0;min. DNA was extracted from the collected pellets for next-generation sequencing (NGS) using a DNeasy<sup>&#xae;</sup> Plant Mini Kit (Qiagen, Hilden, Germany) following the manufacturer&#x2019;s protocol. DNA quantity was measured using the Qubit<sup>&#xae;</sup> double stranded DNA High Sensitivity Assay Kit and the Qubit<sup>&#xae;</sup> 2.0 Fluorometer, while DNA quality was assessed with the NanoDrop<sup>&#xae;</sup> ND-1000 UV-Vis Spectrophotometer.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Plastome sequencing, assembly, and annotation</title>
<p>Total genomic DNA extracted from cultured <italic>Coelastrum</italic> strains was submitted to one of two facilities for high-throughput sequencing: the Genome Sequencing and Analysis Facility (GSAF) at the University of Texas at Austin or to Novogene (Beijing, China). For most strains, short-read sequencing libraries were prepared and sequenced on the Illumina HiSeq 4000 platform (Illumina, San Diego, CA), generating approximately 30 million paired-end reads (150 bp read length) per sample.</p>
<p>Short-read Illumina sequencing failed to yield complete plastome assemblies for three strains&#x2014;SAG 2078, SAG 2248, and SAG 41.86; thus, long-read sequencing was performed on these three strains using the PacBio Sequel II platform, with library preparation and sequencing carried out by Novogene.</p>
<p>Adapter sequences and low-quality bases were removed using BBDuk from the BBTools software suite (<ext-link ext-link-type="uri" xlink:href="https://jgi.doe.gov/data-and-tools/bbtools/">https://jgi.doe.gov/data-and-tools/bbtools/</ext-link>). Clean short reads were assembled <italic>de novo</italic> using NOVOPlasty v4.2.1 (<xref ref-type="bibr" rid="B13">Dierckxsens et&#xa0;al., 2017</xref>) on the Texas Advanced Computing Center (TACC) supercomputing platform, using an optimized k-mer size of 33 and an insert size of 300 bp. Long-read data were assembled with ptGAUL (plastid Genome Assembly Using Long reads) (<xref ref-type="bibr" rid="B62">Zhou et&#xa0;al., 2023</xref>), which is specifically designed for accurate reconstruction of plastid genomes from long-read datasets.</p>
<p>All resulting plastome assemblies were imported into Geneious Prime v2020.2.4 (Biomatters Ltd., Auckland, New Zealand). Assembly completeness, gene order, and IR boundaries for newly sequenced strains were examined, and read mapping was performed using BBMap (<xref ref-type="bibr" rid="B8">Bushnell, 2014</xref>) to verify coverage uniformity and support assembly accuracy. Taxonomic verification was conducted using BLAST searches against the NCBI nucleotide database (<xref ref-type="bibr" rid="B1">Altschul et&#xa0;al., 1990</xref>) to detect possible contaminants and confirm species identity. Plastome sequences were annotated in Geneious based on homologous genes from closely related Scenedesmaceae taxa and further validated with tRNAscan-SE v2.0 (<xref ref-type="bibr" rid="B35">Lowe and Chan, 2016</xref>) for tRNA identification and RNAmmer v1.2 (<xref ref-type="bibr" rid="B30">Lagesen et&#xa0;al., 2007</xref>) for rRNA gene prediction.</p>
<p>IR boundaries and annotations for all strains not sequenced by our laboratory followed annotations downloaded from NCBI.</p>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Phylogenetic analysis</title>
<p>Phylogenetic relationships were inferred using protein coding genes (CDSs) shared across all 29 <italic>Coelastrum</italic> plastomes and at least 16 of the 18 outgroup species (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S3</bold></xref>). Coding sequences for these 62 genes were extracted from the annotated plastomes in Geneious. CDS sequences were aligned using MAFFT v. 7.450 (<xref ref-type="bibr" rid="B27">Katoh and Standley, 2013</xref>) with a default setting in Geneious, and the resulting alignment was used for phylogenetic inference. Missing genes were treated as missing data, and maximum likelihood phylogenies were constructed using IQ-TREE2 v1.6.12 (<xref ref-type="bibr" rid="B37">Minh et&#xa0;al., 2020</xref>) with 1,000 bootstrap replicates. The best-fit substitution model, GTR+F+R5, was selected by ModelFinder (<xref ref-type="bibr" rid="B26">Kalyaanamoorthy et&#xa0;al., 2017</xref>). The resulting phylogenetic tree was visualized in FigTree v1.4.3 (<ext-link ext-link-type="uri" xlink:href="http://tree.bio.ed.ac.uk/software/figtree/">http://tree.bio.ed.ac.uk/software/figtree/</ext-link>).</p>
<p>The aligned data matrix is available from the authors upon request.</p>
<p>IR boundaries determined by methods below for newly obtained sequences, and from NCBI annotations for downloaded plastomes, were mapped onto the best ML tree under parsimony.</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Intron analyses</title>
<p>Intron presence and distribution were assessed across the newly assembled plastomes of <italic>Coelastrum</italic> strains and <italic>Coelastrum microporum</italic> (NC068582). Intron-containing genes were identified manually from the annotated plastomes using Geneious, and exon-intron boundaries were inferred by alignment with homologous plastid sequences from other <italic>Coelastrum</italic> species and from the related Scenedesmaceae genera <italic>Coelastrella</italic>, <italic>Pectinodesmus</italic>, <italic>Scenedesmus</italic>, and <italic>Tetradesmus</italic> (<xref ref-type="bibr" rid="B11">de Cambiaire et&#xa0;al., 2006</xref>; <xref ref-type="bibr" rid="B58">Wang et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B61">Zhao et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B57">Wang et&#xa0;al., 2024</xref>). To confirm intron identity and detect sequence conservation, all intron sequences were queried against the NCBI nucleotide database using BLAST. For each plastome, the total number of introns and the cumulative intron length (bp) were recorded. Intron variation was tabulated across strains and visualized alongside a maximum likelihood phylogeny to assess patterns of intron gain and loss across <italic>Coelastrum</italic> strains.</p>
<p>To evaluate the relationship between intron variation and overall plastome size, Pearson correlation tests were performed using R v4.3.0. Specifically, correlations were assessed between total intron number and size, and non-coding region size. This analysis aimed to identify which genomic features contribute most significantly to plastome size variation within <italic>Coelastrum</italic>.</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Repeat content analysis</title>
<p>Repeat content was analyzed across 29 <italic>Coelastrum</italic> plastomes to evaluate the contribution of repetitive DNA to genome size variation. Prior to analysis, one copy of the inverted repeat (IRA) was removed from each plastome to prevent redundancy. Tandem repeats were detected using Tandem Repeats Finder v.4.09 (<xref ref-type="bibr" rid="B5">Benson, 1999</xref>) via the web interface, with default parameters. The total number and cumulative length of tandem repeats were calculated for each plastome.</p>
<p>Dispersed repeats were detected by running a BLASTN search of each plastome against itself using BLAST v2.16.0+ (<xref ref-type="bibr" rid="B1">Altschul et&#xa0;al., 1990</xref>), with word size of 16 and a minimum identity threshold of 80%, following the methods of <xref ref-type="bibr" rid="B33">Lee et&#xa0;al. (2020)</xref>. Dispersed repeats were identified by retaining BLAST hits whose aligned query and subject regions occurred at distinct, non-overlapping positions within each plastome. Self-hits were removed, and matches representing overlapping or adjacent tandem duplications were excluded to ensure that only dispersed repeats were retained. Total repeats and the proportion of repeat content were calculated for each plastome.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Phylogenetic relationships</title>
<p>Our analysis of plastome data recovered monophyly of all strains of <italic>Coelastrum</italic> with 100% BS support (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S1</bold></xref>). Two nominal species were represented by only one strain each: <italic>C. cambricum</italic> (UTEX 2446), and <italic>C. indicum</italic> (SAG 2363). They were recovered along with <italic>C. microporum</italic> (UTEX 281) in a clade with 100% BS support. The latter species was represented by a total of seven strains. The other six were recovered in two separate clades, with strains UTEX 1354, CG1, CW5, and CS5 in one clade and strains CF1 and SAG 2292 in another. In short, plastome data suggested that the morphology associated with <italic>C. microporum</italic> may consist of several independent lineages. A clade comprising <italic>C. sphaericum</italic> (SAG 1.82 and SAG 32.81) and <italic>C. proboscideum</italic> (UTEX 184 and UTEX 282) had 100% BS support, but neither nominal species was resolved as monophyletic within this clade.</p>
<p>In contrast, all other nominal species were recovered as monophyletic with high BS support. All <italic>C. reticulatum</italic> strains and all <italic>C. morus</italic> strains were each resolved with 100% BS support and those clades were resolved as sister to one another with 100% BS support. All six <italic>C. astroideum</italic> strains (CW1, CG6, CS1, CS3, CS9, and SAG 33.88) and all four <italic>C. pseudomicroporum</italic> strains (CLB, SAG 2077, UTEX 1353, and UTEX 280) were each recovered as monophyletic with 100% BS support.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Plastome general features</title>
<p>The newly assembled plastome sequences had a mean coverage ranging from 563.1 to 2,847.8X for 150 bp paired-end Illumina reads, and from 56.3 to 116.0X for long-read PacBio sequencing (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>). All plastomes were fully annotated and deposited in the NCBI GenBank database, with accession numbers provided in <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>. Each plastome displayed a typical quadripartite structure, consisting of a large single copy (LSC) region and a small single copy (SSC) region with two inverted repeats (IRA and IRB).</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Summary of plastome features across <italic>Coelastrum</italic> species.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" rowspan="2" colspan="2" align="center">Species</th>
<th valign="middle" rowspan="2" align="center">Strain name</th>
<th valign="middle" rowspan="2" align="center">GenBank</th>
<th valign="middle" rowspan="2" align="center">Average depth of coverage</th>
<th valign="middle" colspan="7" align="center">Size (bp)</th>
<th valign="middle" rowspan="2" align="center">GC content (%)</th>
</tr>
<tr>
<th valign="middle" align="center">Plastome</th>
<th valign="middle" align="center">LSC</th>
<th valign="middle" align="center">SSC</th>
<th valign="middle" align="center">IR</th>
<th valign="middle" align="center">Intron</th>
<th valign="middle" align="center">Coding region</th>
<th valign="middle" align="center">Non-coding</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="29" align="left"><italic>Coelastrum</italic></td>
<td valign="middle" align="left"><italic>astroideum</italic></td>
<td valign="middle" align="center">CG6</td>
<td valign="middle" align="center">PX512535</td>
<td valign="middle" align="center">1456.6</td>
<td valign="middle" align="center">186,201</td>
<td valign="middle" align="center">82,667</td>
<td valign="middle" align="center">70,148</td>
<td valign="middle" align="center">16,693</td>
<td valign="middle" align="center">13,128</td>
<td valign="middle" align="center">93,889</td>
<td valign="middle" align="center">92,312</td>
<td valign="middle" align="center">31.0</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>astroideum</italic></td>
<td valign="middle" align="center">CS1</td>
<td valign="middle" align="center">PX512536</td>
<td valign="middle" align="center">771.0</td>
<td valign="middle" align="center">178,665</td>
<td valign="middle" align="center">75,932</td>
<td valign="middle" align="center">65,987</td>
<td valign="middle" align="center">18,373</td>
<td valign="middle" align="center">15,133</td>
<td valign="middle" align="center">93,698</td>
<td valign="middle" align="center">84,967</td>
<td valign="middle" align="center">30.1</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>astroideum</italic></td>
<td valign="middle" align="center">CS3</td>
<td valign="middle" align="center">PX512537</td>
<td valign="middle" align="center">1605.2</td>
<td valign="middle" align="center">175,331</td>
<td valign="middle" align="center">72,367</td>
<td valign="middle" align="center">66,700</td>
<td valign="middle" align="center">18,132</td>
<td valign="middle" align="center">8,744</td>
<td valign="middle" align="center">94,540</td>
<td valign="middle" align="center">80,791</td>
<td valign="middle" align="center">30.3</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>astroideum</italic></td>
<td valign="middle" align="center">CS9</td>
<td valign="middle" align="center">PX512538</td>
<td valign="middle" align="center">563.1</td>
<td valign="middle" align="center">175,332</td>
<td valign="middle" align="center">72,367</td>
<td valign="middle" align="center">66,701</td>
<td valign="middle" align="center">18,132</td>
<td valign="middle" align="center">8,725</td>
<td valign="middle" align="center">94,521</td>
<td valign="middle" align="center">80,811</td>
<td valign="middle" align="center">30.3</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>astroideum</italic></td>
<td valign="middle" align="center">CW1</td>
<td valign="middle" align="center">PX512539</td>
<td valign="middle" align="center">1059.8</td>
<td valign="middle" align="center">186,257</td>
<td valign="middle" align="center">82,662</td>
<td valign="middle" align="center">70,147</td>
<td valign="middle" align="center">16,724</td>
<td valign="middle" align="center">13,126</td>
<td valign="middle" align="center">93,862</td>
<td valign="middle" align="center">92,395</td>
<td valign="middle" align="center">31.0</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>astroideum</italic></td>
<td valign="middle" align="center">SAG33.88</td>
<td valign="middle" align="center">PX512540</td>
<td valign="middle" align="center">1472.3</td>
<td valign="middle" align="center">180,843</td>
<td valign="middle" align="center">76,458</td>
<td valign="middle" align="center">66,863</td>
<td valign="middle" align="center">18,761</td>
<td valign="middle" align="center">13,478</td>
<td valign="middle" align="center">94,527</td>
<td valign="middle" align="center">86,316</td>
<td valign="middle" align="center">30.4</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>cambricum</italic></td>
<td valign="middle" align="center">UTEX2446</td>
<td valign="middle" align="center">PX512541</td>
<td valign="middle" align="center">1955.4</td>
<td valign="middle" align="center">171,270</td>
<td valign="middle" align="center">85,045</td>
<td valign="middle" align="center">68,701</td>
<td valign="middle" align="center">8,762</td>
<td valign="middle" align="center">15,872</td>
<td valign="middle" align="center">93,108</td>
<td valign="middle" align="center">78,162</td>
<td valign="middle" align="center">30.6</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>microporum</italic></td>
<td valign="middle" align="center">CF1</td>
<td valign="middle" align="center">PX512542</td>
<td valign="middle" align="center">1632.0</td>
<td valign="middle" align="center">166,932</td>
<td valign="middle" align="center">83,536</td>
<td valign="middle" align="center">65,694</td>
<td valign="middle" align="center">8,851</td>
<td valign="middle" align="center">14,692</td>
<td valign="middle" align="center">91,083</td>
<td valign="middle" align="center">75,849</td>
<td valign="middle" align="center">30.8</td>
</tr>
<tr>
<td valign="middle" align="left"><bold><italic>microporum</italic></bold></td>
<td valign="middle" align="center">CG1</td>
<td valign="middle" align="center">NC068582</td>
<td valign="middle" align="center">612.2</td>
<td valign="middle" align="center">169,961</td>
<td valign="middle" align="center">85,914</td>
<td valign="middle" align="center">66,611</td>
<td valign="middle" align="center">8,718</td>
<td valign="middle" align="center">15,400</td>
<td valign="middle" align="center">92,014</td>
<td valign="middle" align="center">77,947</td>
<td valign="middle" align="center">31.2</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>microporum</italic></td>
<td valign="middle" align="center">CS5</td>
<td valign="middle" align="center">PX512543</td>
<td valign="middle" align="center">1802.8</td>
<td valign="middle" align="center">168,159</td>
<td valign="middle" align="center">80,353</td>
<td valign="middle" align="center">65,796</td>
<td valign="middle" align="center">11,005</td>
<td valign="middle" align="center">14,523</td>
<td valign="middle" align="center">91,165</td>
<td valign="middle" align="center">76,994</td>
<td valign="middle" align="center">30.9</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>microporum</italic></td>
<td valign="middle" align="center">CW5</td>
<td valign="middle" align="center">PX512544</td>
<td valign="middle" align="center">1828.7</td>
<td valign="middle" align="center">168,103</td>
<td valign="middle" align="center">80,344</td>
<td valign="middle" align="center">65,783</td>
<td valign="middle" align="center">10,988</td>
<td valign="middle" align="center">14,524</td>
<td valign="middle" align="center">91,165</td>
<td valign="middle" align="center">76,938</td>
<td valign="middle" align="center">30.9</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>microporum</italic></td>
<td valign="middle" align="center">SAG2292</td>
<td valign="middle" align="center">PX512545</td>
<td valign="middle" align="center">1917.7</td>
<td valign="middle" align="center">171,509</td>
<td valign="middle" align="center">85,345</td>
<td valign="middle" align="center">66,488</td>
<td valign="middle" align="center">9,838</td>
<td valign="middle" align="center">20,746</td>
<td valign="middle" align="center">91,053</td>
<td valign="middle" align="center">80,456</td>
<td valign="middle" align="center">31.1</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>microporum</italic></td>
<td valign="middle" align="center">UTEX281</td>
<td valign="middle" align="center">PX512546</td>
<td valign="middle" align="center">1363.4</td>
<td valign="middle" align="center">186,093</td>
<td valign="middle" align="center">98,646</td>
<td valign="middle" align="center">72,147</td>
<td valign="middle" align="center">7,650</td>
<td valign="middle" align="center">11,169</td>
<td valign="middle" align="center">93,335</td>
<td valign="middle" align="center">92,758</td>
<td valign="middle" align="center">30.9</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>microporum</italic></td>
<td valign="middle" align="center">UTEX1354</td>
<td valign="middle" align="center">PX512547</td>
<td valign="middle" align="center">1571.6</td>
<td valign="middle" align="center">170,796</td>
<td valign="middle" align="center">80,475</td>
<td valign="middle" align="center">65,797</td>
<td valign="middle" align="center">12,262</td>
<td valign="middle" align="center">17,216</td>
<td valign="middle" align="center">91,165</td>
<td valign="middle" align="center">79,631</td>
<td valign="middle" align="center">31.0</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>morus</italic></td>
<td valign="middle" align="center">SAG2078</td>
<td valign="middle" align="center">PX512671</td>
<td valign="middle" align="center">116.0</td>
<td valign="middle" align="center">298,895</td>
<td valign="middle" align="center">139,858</td>
<td valign="middle" align="center">87,785</td>
<td valign="middle" align="center">35,626</td>
<td valign="middle" align="center">25,873</td>
<td valign="middle" align="center">94,381</td>
<td valign="middle" align="center">204,514</td>
<td valign="middle" align="center">27.4</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>morus</italic></td>
<td valign="middle" align="center">SAG2248</td>
<td valign="middle" align="center">PX512672</td>
<td valign="middle" align="center">102.5</td>
<td valign="middle" align="center">552,967</td>
<td valign="middle" align="center">223,506</td>
<td valign="middle" align="center">199,160</td>
<td valign="middle" align="center">65,144</td>
<td valign="middle" align="center">67,640</td>
<td valign="middle" align="center">98,170</td>
<td valign="middle" align="center">454,797</td>
<td valign="middle" align="center">30.5</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>morus</italic></td>
<td valign="middle" align="center">SAG41.86</td>
<td valign="middle" align="center">PX512673</td>
<td valign="middle" align="center">56.3</td>
<td valign="middle" align="center">553,457</td>
<td valign="middle" align="center">224,087</td>
<td valign="middle" align="center">199,103</td>
<td valign="middle" align="center">65,144</td>
<td valign="middle" align="center">67,640</td>
<td valign="middle" align="center">98,170</td>
<td valign="middle" align="center">455,287</td>
<td valign="middle" align="center">30.5</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>proboscideum</italic> var. <italic>dilatatum</italic></td>
<td valign="middle" align="center">UTEX282</td>
<td valign="middle" align="center">PX512548</td>
<td valign="middle" align="center">1783.9</td>
<td valign="middle" align="center">203,945</td>
<td valign="middle" align="center">103,673</td>
<td valign="middle" align="center">80,474</td>
<td valign="middle" align="center">9,899</td>
<td valign="middle" align="center">18,490</td>
<td valign="middle" align="center">93,866</td>
<td valign="middle" align="center">110,079</td>
<td valign="middle" align="center">30.1</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>proboscideum</italic> var. <italic>gracile</italic></td>
<td valign="middle" align="center">UTEX184</td>
<td valign="middle" align="center">PX512549</td>
<td valign="middle" align="center">1365.4</td>
<td valign="middle" align="center">208,184</td>
<td valign="middle" align="center">103,669</td>
<td valign="middle" align="center">79,203</td>
<td valign="middle" align="center">12,656</td>
<td valign="middle" align="center">18,487</td>
<td valign="middle" align="center">92,993</td>
<td valign="middle" align="center">115,191</td>
<td valign="middle" align="center">30.3</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>pseudomicroporum</italic></td>
<td valign="middle" align="center">CLB</td>
<td valign="middle" align="center">PX512550</td>
<td valign="middle" align="center">1957.2</td>
<td valign="middle" align="center">179,623</td>
<td valign="middle" align="center">89,320</td>
<td valign="middle" align="center">68,767</td>
<td valign="middle" align="center">10,768</td>
<td valign="middle" align="center">29,032</td>
<td valign="middle" align="center">91,022</td>
<td valign="middle" align="center">88,601</td>
<td valign="middle" align="center">32.1</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>pseudomicroporum</italic></td>
<td valign="middle" align="center">SAG2077</td>
<td valign="middle" align="center">PX512551</td>
<td valign="middle" align="center">2847.8</td>
<td valign="middle" align="center">167,559</td>
<td valign="middle" align="center">84,152</td>
<td valign="middle" align="center">65,347</td>
<td valign="middle" align="center">9,030</td>
<td valign="middle" align="center">16,714</td>
<td valign="middle" align="center">91,021</td>
<td valign="middle" align="center">76,538</td>
<td valign="middle" align="center">31.4</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>pseudomicroporum</italic></td>
<td valign="middle" align="center">UTEX280</td>
<td valign="middle" align="center">PX512552</td>
<td valign="middle" align="center">2189.6</td>
<td valign="middle" align="center">167,578</td>
<td valign="middle" align="center">84,254</td>
<td valign="middle" align="center">65,204</td>
<td valign="middle" align="center">9,060</td>
<td valign="middle" align="center">16,647</td>
<td valign="middle" align="center">91,090</td>
<td valign="middle" align="center">76,488</td>
<td valign="middle" align="center">31.4</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>pseudomicroporum</italic></td>
<td valign="middle" align="center">UTEX1353</td>
<td valign="middle" align="center">PX512553</td>
<td valign="middle" align="center">1345.4</td>
<td valign="middle" align="center">166,827</td>
<td valign="middle" align="center">82,056</td>
<td valign="middle" align="center">64,851</td>
<td valign="middle" align="center">9,960</td>
<td valign="middle" align="center">16,222</td>
<td valign="middle" align="center">91,082</td>
<td valign="middle" align="center">75,745</td>
<td valign="middle" align="center">31.9</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>indicum</italic></td>
<td valign="middle" align="center">SAG2363</td>
<td valign="middle" align="center">PX512554</td>
<td valign="middle" align="center">1993.9</td>
<td valign="middle" align="center">198,867</td>
<td valign="middle" align="center">90,540</td>
<td valign="middle" align="center">69,579</td>
<td valign="middle" align="center">19,374</td>
<td valign="middle" align="center">28,366</td>
<td valign="middle" align="center">95,196</td>
<td valign="middle" align="center">103,671</td>
<td valign="middle" align="center">30.5</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>reticulatum</italic></td>
<td valign="middle" align="center">CG10</td>
<td valign="middle" align="center">PX512555</td>
<td valign="middle" align="center">664.8</td>
<td valign="middle" align="center">200,459</td>
<td valign="middle" align="center">107,222</td>
<td valign="middle" align="center">74,859</td>
<td valign="middle" align="center">9,189</td>
<td valign="middle" align="center">9,580</td>
<td valign="middle" align="center">93,038</td>
<td valign="middle" align="center">107,421</td>
<td valign="middle" align="center">29.3</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>reticulatum</italic></td>
<td valign="middle" align="center">SAG8.81</td>
<td valign="middle" align="center">PX512556</td>
<td valign="middle" align="center">1410.4</td>
<td valign="middle" align="center">193,431</td>
<td valign="middle" align="center">95,451</td>
<td valign="middle" align="center">73,942</td>
<td valign="middle" align="center">12,019</td>
<td valign="middle" align="center">16,782</td>
<td valign="middle" align="center">93,651</td>
<td valign="middle" align="center">99,780</td>
<td valign="middle" align="center">29.1</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>reticulatum</italic></td>
<td valign="middle" align="center">UTEX1365</td>
<td valign="middle" align="center">PX512557</td>
<td valign="middle" align="center">1035.7</td>
<td valign="middle" align="center">242,214</td>
<td valign="middle" align="center">92,255</td>
<td valign="middle" align="center">58,315</td>
<td valign="middle" align="center">45,822</td>
<td valign="middle" align="center">16,288</td>
<td valign="middle" align="center">89,638</td>
<td valign="middle" align="center">152,576</td>
<td valign="middle" align="center">30.3</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>sphaericum</italic></td>
<td valign="middle" align="center">SAG1.82</td>
<td valign="middle" align="center">PX512558</td>
<td valign="middle" align="center">1035.9</td>
<td valign="middle" align="center">208,400</td>
<td valign="middle" align="center">103,667</td>
<td valign="middle" align="center">79,319</td>
<td valign="middle" align="center">12,707</td>
<td valign="middle" align="center">18,488</td>
<td valign="middle" align="center">93,122</td>
<td valign="middle" align="center">115,278</td>
<td valign="middle" align="center">30.3</td>
</tr>
<tr>
<td valign="middle" align="left"><italic>sphaericum</italic></td>
<td valign="middle" align="center">SAG32.81</td>
<td valign="middle" align="center">PX512559</td>
<td valign="middle" align="center">1124.2</td>
<td valign="middle" align="center">208,308</td>
<td valign="middle" align="center">103,672</td>
<td valign="middle" align="center">79,186</td>
<td valign="middle" align="center">12,725</td>
<td valign="middle" align="center">18,489</td>
<td valign="middle" align="center">93,122</td>
<td valign="middle" align="center">115,186</td>
<td valign="middle" align="center">30.3</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Genomes obtained from NCBI are indicated by species names in bold.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>Despite this conserved structural organization, plastome sizes showed substantial interspecific variation, ranging from 166,827 bp in <italic>Coelastrum pseudomicroporum</italic> (UTEX 1353) to 553,457 bp in <italic>Coelastrum morus</italic> (SAG 41.86) (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref> and <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>). The size of the single copy regions ranged from 137,407 bp to 423,190 bp (approximately a threefold range), whereas IR size ranged from 7,650 bp to 65,144 bp, representing more than an eightfold range. These regions corresponded to 8.2% and 37.84% of total plastome size, respectively.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Phylogenetic relationships and plastome structural variation among 29 <italic>Coelastrum</italic> strains. The cladogram is based on the phylogram shown in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S1</bold></xref>. Bootstrap values less than 100% are indicated at the nodes. Variety names (<italic>Coelastrum proboscideum</italic> var. <italic>gracile</italic> UTEX184; <italic>C. proboscideum</italic> var. <italic>dilatatum</italic> UTEX282) were omitted from the figure labels for conciseness. Colored markers denote gene and tRNA losses mapped onto the relevant branches. Plastome, LSC, SSC and IR variation are indicated in bp (see also <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1736783-g001.tif">
<alt-text content-type="machine-generated">Phylogenetic tree of Coelastrum species showing gene loss and tRNA loss. Strains are listed with corresponding plastome sizes in green, large single-copy regions in orange, small single-copy regions in blue, and inverted repeat regions in gray. Gene losses are marked in red and tRNA losses in green. Scale indicates branch length.</alt-text>
</graphic></fig>
<p>There were four types of inverted repeat boundaries (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref>). Inverted repeat expansion in certain lineages resulted in the translocation of four genes (<italic>psbC</italic>, <italic>atpF</italic>, <italic>atpH</italic>, and <italic>ftsH</italic>) across the LSC and the IR region. In Type 1, <italic>psbC</italic> was positioned in the LSC region near the IRB-LSC junction in the <italic>C. morus</italic> clade and in <italic>C. reticulatum</italic> CG10. It was also found in <italic>C. cambricum</italic> and all <italic>C. microporum</italic> and <italic>C. pseudomicroporum</italic>. The Type 2 boundary is similar, with the IR boundary bisecting the <italic>psbC</italic> gene, and was found in two <italic>C. reticulatum</italic> strains (SAG 8.81 and UTEX 1365) and in the <italic>C. sphaericum</italic>&#x2013;<italic>C. proboscideum</italic> clade. Type 3 was restricted to <italic>C. indicum</italic>, which retained the <italic>psbC</italic> and <italic>atpF</italic> genes in the LSC, whereas the <italic>atpH</italic> and <italic>ftsH</italic> genes were found in the IRB region. Type 4 had a partial duplication of the <italic>ftsH</italic> gene within the IRB region of <italic>C. astroideum</italic>. Outgroup plastomes nearly all had the Type 1 boundary. <italic>Pectinodesmus pectinatus</italic> (NC036668) and <italic>Tetradesmus obliquus</italic> (NC008101) had Type 2 boundaries. <italic>Crucigenia lauterbornii</italic> (PP979532) and <italic>Coronastrum ellipsoideum</italic> (PP979513) had IR boundaries very different from those of any of the other plastomes. Regardless of where one might draw the root among outgroups, Type 1 still maps unambiguously as plesiomorphic to all of <italic>Coelastrum</italic>.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Inverted repeat (IR) boundary variation across major <italic>Coelastrum</italic> clades. Left: Phylogenetic tree of 29 <italic>Coelastrum</italic> strains and three outgroups, with branch colors indicating distinct IR structures. Right: Representative plastome maps showing IRB&#x2013;LSC boundaries, with gene positions and duplications linked to IR expansion. Colors match the clades in the tree.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1736783-g002.tif">
<alt-text content-type="machine-generated">Phylogenetic tree diagram illustrating relationships of Coelastrum strains of four different types of boundaries between the inverted repeat region B (IRB) and large-single copy (LSC) region. This is illustrated by the location of four genes, psbC, atpF, atpH, and ftsH. All four genes are in the LSC in Type 1 (black branches). The psbC gene overlaps the IRB-LSC boundary in Type 2 (blue branches). The psbC and atpF genes are in the IRB in Type 3 (yellow branch). These two genes plus the atpH gene are in the IRB, and ftsH overlaps both regions in Type 4 (green branches).</alt-text>
</graphic></fig>
<p>The total coding region length ranged from 89,638 bp to 98,170 bp (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>). Overall GC content across the genus was relatively consistent, ranging from 29.1% to 32.1%. However, one <italic>C. morus</italic> strain showed a lower GC content of 27.4%. In contrast, non-coding regions varied across strains, from 75,745 bp to 455,287 bp, comprising up to 82.3% of the total plastome length. This variation in non-coding content likely plays a central role in the plastome size differences observed among <italic>Coelastrum</italic> strains. To investigate the potential origins of the expanded intergenic regions in <italic>C. morus</italic>, we performed BLAST searches using representative intergenic sequences. These searches yielded no significant matches.</p>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Gene loss and intron variation</title>
<p>Comparative analyses of gene content across 29 <italic>Coelastrum</italic> plastomes revealed overall conservation in core gene composition, with the exception of minor variation in tRNA gene content (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Table S1</bold></xref>). The most pronounced case of gene loss was observed in <italic>Coelastrum reticulatum</italic> (UTEX 1365), which lacked five contiguous genes, <italic>clpP</italic>, <italic>rpl2</italic>, <italic>rpl23</italic>, <italic>rps4</italic>, and <italic>rps19</italic>, that are typically co-localized within the small single copy (SSC) region in other <italic>Coelastrum</italic> strains (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref>). This does not appear to be an artefact as coverage was deep and uniform across the region of interest (<xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S3</bold></xref>). In addition, <italic>trnF</italic>-GAA and <italic>trnL</italic>-TAG were also absent in this strain, suggesting either a localized deletion event or significant genomic rearrangement in the SSC region. Independent tRNA gene losses were detected in two additional strains: <italic>trnR</italic>-UCU was absent in <italic>C. reticulatum</italic> (SAG 8.81), and <italic>trnS</italic>-GCU was missing from <italic>C. proboscideum</italic> (UTEX 282).</p>
<p>Across the 29 assembled <italic>Coelastrum</italic> plastomes, intron distribution showed considerable heterogeneity in both location and frequency, reflecting dynamic evolutionary events. A total of 13 genes were identified as intron-bearing, with <italic>psaA</italic>, <italic>psbA</italic>, <italic>psbC</italic>, <italic>rbcL</italic>, and <italic>rrn23</italic> exhibiting the greatest variability in intron content and length (<xref ref-type="fig" rid="f3"><bold>Figure&#xa0;3</bold></xref>). The <italic>psaA</italic> gene consistently displayed a trans-spliced structure with introns separating three exons. The cis-spliced configuration was observed in most <italic>Coelastrum</italic> strains.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Heatmap of the number of introns across plastid genes for <italic>Coelastrum</italic> species. Numbers within cells denote the number of introns in each gene, while blank cells indicate the absence of introns.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1736783-g003.tif">
<alt-text content-type="machine-generated">Heatmap displaying presence and number of introns in Coelastrum strains used in this study. Rows represent strains, and columns indicate number of introns within each indicated gene (bottom line). The number in each cell represents the number of introns in a specific gene for a specific strain. Darker shades of blue represent more introns per gene (up to 12 for the darkest blue). White blank cells indicate the absence of introns in that gene.</alt-text>
</graphic></fig>
<p>Unique intron insertions were identified in several genes across the <italic>Coelastrum</italic> plastomes. Notably, an intron at position 66 in the <italic>psbE</italic> gene was detected in two of the three <italic>C. morus</italic> strains, but was absent in the third strain, indicating strain-specific intron retention or loss within the species. The <italic>psbZ</italic> intron (position 65) was observed only in <italic>C. cambricum</italic>, suggesting this to be a unique insertion event within <italic>Coelastrum</italic>. The <italic>atpA</italic> intron, located at site 489, was present in three strains of <italic>C. astroideum</italic> that did not form a monophyletic group and one strain of <italic>C. microporum</italic> (UTEX 2446) in an unrelated clade. The canonical group I intron within <italic>trnL</italic>-UAA was conserved across all sampled plastomes, consistent with its widely reported vertical inheritance and evolutionary stability within Chlorophyta.</p>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Plastome size variation</title>
<p>Four strains were outliers in terms of overall plastome size (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>). The two largest plastomes belonged to two <italic>C. morus</italic> strains (SAG 2248 and SAG 41.86). They were nearly identical in size to each other but were 85% larger than the plastome of the third <italic>C. morus</italic> strain, SAG 2078, which in turn was 23% larger than that of <italic>C. reticulatum</italic> UTEX 1365. The latter was 16% larger than the next largest. After that, there was never more than a 4% difference in plastome size between any two strains. The reporting that follows refers to these four largest strains as the outliers, or as the four large strains.</p>
<p>There was relatively little variation in coding region size whether or not one considered outliers. For example, the coefficient of variation of the aggregate size of coding regions (from both single copy regions plus one IR copy) was about 2.2% with outliers and 1.5% without outliers (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>). The largest absolute contributor to plastome size was the non-coding region size which accounted for over 99% of the variation in total genome size whether or not outlier strains were included (r = 0.99, p &lt; 0.001; <xref ref-type="fig" rid="f4"><bold>Figures&#xa0;4A, B</bold></xref>).</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Pearson correlation between plastome size and key genomic features in <italic>Coelastrum</italic> strains with and without outliers, defined in the text as <italic>C. morus</italic> strains SAG 2078, SAG 2248, and SAG 41.86, and <italic>C. reticulatum</italic> UTEX 1365 (N&#xa0;=&#xa0;29 and N&#xa0;=&#xa0;25, respectively). Blue lines represent linear regression fits with 95% confidence intervals in gray shading. Pearson correlation coefficients (r) and p-values are shown in each graph. <bold>(A, B)</bold> Aggregate non-coding region size versus plastome size; <bold>(C, D)</bold> Number of introns versus aggregate non-coding region size; <bold>(E, F)</bold> Intron size versus aggregate non-coding region size; <bold>(G, H)</bold> Number of repeats versus aggregate non-coding region size; <bold>(I, J)</bold> Repeat size versus aggregate non-coding region size; <bold>(K, L)</bold> IR size versus plastome size; <bold>(M, N)</bold> Non-coding region size in IRA versus total IRA size.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-17-1736783-g004.tif">
<alt-text content-type="machine-generated">Fourteen scatter plots labeled A to N show correlations between variables like plastome size, non-coding region size, number of introns, number of repeats, and repeat size. Each plot includes a trend line and correlation coefficients (r values) with significance (p-values). Sample sizes vary, indicated by N values, and shaded regions represent confidence intervals.</alt-text>
</graphic></fig>
<p>We then analyzed the contribution of various elements to aggregate non-coding region size. With outlier strains included, intron number and aggregate intron size were each positively correlated with non-coding size (<xref ref-type="fig" rid="f4"><bold>Figures&#xa0;4C, E</bold></xref>), but removal of the outliers left no significant correlation (<xref ref-type="fig" rid="f4"><bold>Figures&#xa0;4D, F</bold></xref>). However, regardless of whether or not outliers were included, total number and aggregate size of repeated elements were correlated with aggregate non-coding region size (<xref ref-type="fig" rid="f4"><bold>Figures&#xa0;4G&#x2013;J</bold></xref>).</p>
<p>That repeat elements were important contributors to size variation in all strains warranted more detailed investigation of these elements. Across the 29 <italic>Coelastrum</italic> plastomes, both dispersed and tandem repeats exhibited lineage-specific variation (<xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>). In the compact plastomes, dispersed repeat content was typically limited to 1&#x2013;5 repeats per plastome, totaling &lt;1,000 bp and contributing &lt;0.5% of the genome. Tandem repeats in these compact plastomes were likewise limited, generally numbering fewer than 40 and spanning &lt;2,000 bp, corresponding to &lt;1% of total plastome size. In sharp contrast, repeat proliferation was dramatic in the <italic>C. morus</italic> lineage. The two giant plastomes, SAG 2248 and SAG 41.86, contained more than 26,000 dispersed repeats, representing ~200 kb of sequence and accounting for ~41% of their genome size. These same strains also harbored exceptionally high levels of tandem repeats, each exceeding 400 elements and ~53,000 bp in total length (~10% of the genome). Altogether, repetitive DNA surpassed 250 kb in these plastomes, contributing more than 50% of total genome size, whereas all non-outlier <italic>Coelastrum</italic> plastomes contained &lt;5% repetitive DNA. Intermediate cases, such as <italic>C. reticulatum</italic> (UTEX 1365) and <italic>C. morus</italic> (SAG 2078), exhibited moderate repeat proliferation (179 and 975 dispersed repeats totaling ~7.6 kb and ~71.5 kb, respectively), suggesting that repeat accumulation may have occurred in a stepwise and lineage-specific manner. These results again highlight repetitive DNA, both dispersed and tandem repeats, as a major driver of the genome size variation observed within <italic>Coelastrum</italic>.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Dispersed and tandem repeat contents across 29 <italic>Coelastrum</italic> plastomes.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" rowspan="2" align="center">Strain name</th>
<th valign="middle" rowspan="2" align="center">Plastome size (removed IRA)</th>
<th valign="middle" colspan="3" align="center">Dispersed repeat</th>
<th valign="middle" colspan="3" align="center">Tandem repeat</th>
<th valign="middle" colspan="3" align="center">Total repeat</th>
</tr>
<tr>
<th valign="middle" align="center">Number</th>
<th valign="middle" align="center">Total length (bp)</th>
<th valign="middle" align="center">Content (%)</th>
<th valign="middle" align="center">Number</th>
<th valign="middle" align="center">Total length (bp)</th>
<th valign="middle" align="center">Content (%)</th>
<th valign="middle" align="center">Number</th>
<th valign="middle" align="center">Length (bp)</th>
<th valign="middle" align="center">Content (%)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">UTEX1353</td>
<td valign="middle" align="center">156,867</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">200</td>
<td valign="middle" align="center">0.1</td>
<td valign="middle" align="center">22</td>
<td valign="middle" align="center">886</td>
<td valign="middle" align="center">0.6</td>
<td valign="middle" align="center">23</td>
<td valign="middle" align="center">1,086</td>
<td valign="middle" align="center">0.7</td>
</tr>
<tr>
<td valign="middle" align="center">CF1</td>
<td valign="middle" align="center">158,081</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">154</td>
<td valign="middle" align="center">0.1</td>
<td valign="middle" align="center">26</td>
<td valign="middle" align="center">1,178</td>
<td valign="middle" align="center">0.7</td>
<td valign="middle" align="center">27</td>
<td valign="middle" align="center">1,332</td>
<td valign="middle" align="center">0.8</td>
</tr>
<tr>
<td valign="middle" align="center">SAG2077</td>
<td valign="middle" align="center">158,529</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">159</td>
<td valign="middle" align="center">0.1</td>
<td valign="middle" align="center">36</td>
<td valign="middle" align="center">1,485</td>
<td valign="middle" align="center">0.9</td>
<td valign="middle" align="center">37</td>
<td valign="middle" align="center">1,644</td>
<td valign="middle" align="center">1.0</td>
</tr>
<tr>
<td valign="middle" align="center">UTEX280</td>
<td valign="middle" align="center">158,518</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">159</td>
<td valign="middle" align="center">0.1</td>
<td valign="middle" align="center">36</td>
<td valign="middle" align="center">1,493</td>
<td valign="middle" align="center">0.9</td>
<td valign="middle" align="center">37</td>
<td valign="middle" align="center">1,652</td>
<td valign="middle" align="center">1.0</td>
</tr>
<tr>
<td valign="middle" align="center">CW5</td>
<td valign="middle" align="center">157,115</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">148</td>
<td valign="middle" align="center">0.1</td>
<td valign="middle" align="center">25</td>
<td valign="middle" align="center">968</td>
<td valign="middle" align="center">0.6</td>
<td valign="middle" align="center">26</td>
<td valign="middle" align="center">1,116</td>
<td valign="middle" align="center">0.7</td>
</tr>
<tr>
<td valign="middle" align="center">CS5</td>
<td valign="middle" align="center">157,154</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">148</td>
<td valign="middle" align="center">0.1</td>
<td valign="middle" align="center">25</td>
<td valign="middle" align="center">1,020</td>
<td valign="middle" align="center">0.6</td>
<td valign="middle" align="center">26</td>
<td valign="middle" align="center">1,168</td>
<td valign="middle" align="center">0.7</td>
</tr>
<tr>
<td valign="middle" align="center">CG1</td>
<td valign="middle" align="center">161,243</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">191</td>
<td valign="middle" align="center">0.1</td>
<td valign="middle" align="center">28</td>
<td valign="middle" align="center">1,262</td>
<td valign="middle" align="center">0.8</td>
<td valign="middle" align="center">29</td>
<td valign="middle" align="center">1,453</td>
<td valign="middle" align="center">0.9</td>
</tr>
<tr>
<td valign="middle" align="center">UTEX1354</td>
<td valign="middle" align="center">158,534</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">148</td>
<td valign="middle" align="center">0.1</td>
<td valign="middle" align="center">25</td>
<td valign="middle" align="center">979</td>
<td valign="middle" align="center">0.6</td>
<td valign="middle" align="center">26</td>
<td valign="middle" align="center">1,127</td>
<td valign="middle" align="center">0.7</td>
</tr>
<tr>
<td valign="middle" align="center">UTEX2446</td>
<td valign="middle" align="center">162,508</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">171</td>
<td valign="middle" align="center">0.1</td>
<td valign="middle" align="center">21</td>
<td valign="middle" align="center">834</td>
<td valign="middle" align="center">0.5</td>
<td valign="middle" align="center">22</td>
<td valign="middle" align="center">1,005</td>
<td valign="middle" align="center">0.6</td>
</tr>
<tr>
<td valign="middle" align="center">SAG2292</td>
<td valign="middle" align="center">161,671</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">236</td>
<td valign="middle" align="center">0.1</td>
<td valign="middle" align="center">20</td>
<td valign="middle" align="center">788</td>
<td valign="middle" align="center">0.5</td>
<td valign="middle" align="center">21</td>
<td valign="middle" align="center">1,024</td>
<td valign="middle" align="center">0.6</td>
</tr>
<tr>
<td valign="middle" align="center">CS3</td>
<td valign="middle" align="center">157,199</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">154</td>
<td valign="middle" align="center">0.1</td>
<td valign="middle" align="center">15</td>
<td valign="middle" align="center">555</td>
<td valign="middle" align="center">0.4</td>
<td valign="middle" align="center">16</td>
<td valign="middle" align="center">709</td>
<td valign="middle" align="center">0.5</td>
</tr>
<tr>
<td valign="middle" align="center">CS9</td>
<td valign="middle" align="center">157,200</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">154</td>
<td valign="middle" align="center">0.1</td>
<td valign="middle" align="center">16</td>
<td valign="middle" align="center">589</td>
<td valign="middle" align="center">0.4</td>
<td valign="middle" align="center">17</td>
<td valign="middle" align="center">743</td>
<td valign="middle" align="center">0.5</td>
</tr>
<tr>
<td valign="middle" align="center">CS1</td>
<td valign="middle" align="center">160,292</td>
<td valign="middle" align="center">2</td>
<td valign="middle" align="center">279</td>
<td valign="middle" align="center">0.2</td>
<td valign="middle" align="center">16</td>
<td valign="middle" align="center">682</td>
<td valign="middle" align="center">0.4</td>
<td valign="middle" align="center">18</td>
<td valign="middle" align="center">961</td>
<td valign="middle" align="center">0.6</td>
</tr>
<tr>
<td valign="middle" align="center">CLB</td>
<td valign="middle" align="center">168,855</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">200</td>
<td valign="middle" align="center">0.1</td>
<td valign="middle" align="center">29</td>
<td valign="middle" align="center">1,267</td>
<td valign="middle" align="center">0.8</td>
<td valign="middle" align="center">30</td>
<td valign="middle" align="center">1,467</td>
<td valign="middle" align="center">0.9</td>
</tr>
<tr>
<td valign="middle" align="center">SAG33.88</td>
<td valign="middle" align="center">162,082</td>
<td valign="middle" align="center">5</td>
<td valign="middle" align="center">578</td>
<td valign="middle" align="center">0.4</td>
<td valign="middle" align="center">22</td>
<td valign="middle" align="center">923</td>
<td valign="middle" align="center">0.6</td>
<td valign="middle" align="center">27</td>
<td valign="middle" align="center">1,501</td>
<td valign="middle" align="center">0.9</td>
</tr>
<tr>
<td valign="middle" align="center">UTEX281</td>
<td valign="middle" align="center">178,443</td>
<td valign="middle" align="center">1</td>
<td valign="middle" align="center">146</td>
<td valign="middle" align="center">0.1</td>
<td valign="middle" align="center">38</td>
<td valign="middle" align="center">1,916</td>
<td valign="middle" align="center">1.1</td>
<td valign="middle" align="center">39</td>
<td valign="middle" align="center">2,062</td>
<td valign="middle" align="center">1.2</td>
</tr>
<tr>
<td valign="middle" align="center">CG6</td>
<td valign="middle" align="center">169,508</td>
<td valign="middle" align="center">5</td>
<td valign="middle" align="center">716</td>
<td valign="middle" align="center">0.4</td>
<td valign="middle" align="center">20</td>
<td valign="middle" align="center">1,110</td>
<td valign="middle" align="center">0.7</td>
<td valign="middle" align="center">25</td>
<td valign="middle" align="center">1,826</td>
<td valign="middle" align="center">1.1</td>
</tr>
<tr>
<td valign="middle" align="center">CW1</td>
<td valign="middle" align="center">169,533</td>
<td valign="middle" align="center">5</td>
<td valign="middle" align="center">716</td>
<td valign="middle" align="center">0.4</td>
<td valign="middle" align="center">20</td>
<td valign="middle" align="center">1,177</td>
<td valign="middle" align="center">0.7</td>
<td valign="middle" align="center">25</td>
<td valign="middle" align="center">1,893</td>
<td valign="middle" align="center">1.1</td>
</tr>
<tr>
<td valign="middle" align="center">SAG8.81</td>
<td valign="middle" align="center">181,412</td>
<td valign="middle" align="center">8</td>
<td valign="middle" align="center">840</td>
<td valign="middle" align="center">0.5</td>
<td valign="middle" align="center">69</td>
<td valign="middle" align="center">3,337</td>
<td valign="middle" align="center">1.8</td>
<td valign="middle" align="center">77</td>
<td valign="middle" align="center">4,177</td>
<td valign="middle" align="center">2.3</td>
</tr>
<tr>
<td valign="middle" align="center">SAG2363</td>
<td valign="middle" align="center">179,421</td>
<td valign="middle" align="center">2</td>
<td valign="middle" align="center">274</td>
<td valign="middle" align="center">0.2</td>
<td valign="middle" align="center">32</td>
<td valign="middle" align="center">1,454</td>
<td valign="middle" align="center">0.8</td>
<td valign="middle" align="center">34</td>
<td valign="middle" align="center">1,728</td>
<td valign="middle" align="center">1.0</td>
</tr>
<tr>
<td valign="middle" align="center">CG10</td>
<td valign="middle" align="center">191,270</td>
<td valign="middle" align="center">9</td>
<td valign="middle" align="center">1,737</td>
<td valign="middle" align="center">0.9</td>
<td valign="middle" align="center">75</td>
<td valign="middle" align="center">3,110</td>
<td valign="middle" align="center">1.6</td>
<td valign="middle" align="center">84</td>
<td valign="middle" align="center">4,847</td>
<td valign="middle" align="center">2.5</td>
</tr>
<tr>
<td valign="middle" align="center">UTEX282</td>
<td valign="middle" align="center">194,046</td>
<td valign="middle" align="center">49</td>
<td valign="middle" align="center">3,766</td>
<td valign="middle" align="center">1.9</td>
<td valign="middle" align="center">46</td>
<td valign="middle" align="center">3,471</td>
<td valign="middle" align="center">1.8</td>
<td valign="middle" align="center">95</td>
<td valign="middle" align="center">7,237</td>
<td valign="middle" align="center">3.7</td>
</tr>
<tr>
<td valign="middle" align="center">UTEX184</td>
<td valign="middle" align="center">195,528</td>
<td valign="middle" align="center">53</td>
<td valign="middle" align="center">4,309</td>
<td valign="middle" align="center">2.2</td>
<td valign="middle" align="center">60</td>
<td valign="middle" align="center">3,267</td>
<td valign="middle" align="center">1.7</td>
<td valign="middle" align="center">113</td>
<td valign="middle" align="center">7,576</td>
<td valign="middle" align="center">3.9</td>
</tr>
<tr>
<td valign="middle" align="center">SAG32.81</td>
<td valign="middle" align="center">195,583</td>
<td valign="middle" align="center">65</td>
<td valign="middle" align="center">4,446</td>
<td valign="middle" align="center">2.3</td>
<td valign="middle" align="center">59</td>
<td valign="middle" align="center">3,280</td>
<td valign="middle" align="center">1.7</td>
<td valign="middle" align="center">124</td>
<td valign="middle" align="center">7,726</td>
<td valign="middle" align="center">4.0</td>
</tr>
<tr>
<td valign="middle" align="center">SAG1.82</td>
<td valign="middle" align="center">195,693</td>
<td valign="middle" align="center">62</td>
<td valign="middle" align="center">4,533</td>
<td valign="middle" align="center">2.3</td>
<td valign="middle" align="center">61</td>
<td valign="middle" align="center">3,481</td>
<td valign="middle" align="center">1.8</td>
<td valign="middle" align="center">123</td>
<td valign="middle" align="center">8,014</td>
<td valign="middle" align="center">4.1</td>
</tr>
<tr>
<td valign="middle" align="center">UTEX1365</td>
<td valign="middle" align="center">196,392</td>
<td valign="middle" align="center">179</td>
<td valign="middle" align="center">7,627</td>
<td valign="middle" align="center">3.9</td>
<td valign="middle" align="center">100</td>
<td valign="middle" align="center">5,043</td>
<td valign="middle" align="center">2.6</td>
<td valign="middle" align="center">279</td>
<td valign="middle" align="center">12,670</td>
<td valign="middle" align="center">6.5</td>
</tr>
<tr>
<td valign="middle" align="center">SAG2078</td>
<td valign="middle" align="center">263,269</td>
<td valign="middle" align="center">975</td>
<td valign="middle" align="center">71,475</td>
<td valign="middle" align="center">27.1</td>
<td valign="middle" align="center">121</td>
<td valign="middle" align="center">8,151</td>
<td valign="middle" align="center">3.1</td>
<td valign="middle" align="center">1,096</td>
<td valign="middle" align="center">79,626</td>
<td valign="middle" align="center">30.2</td>
</tr>
<tr>
<td valign="middle" align="center">SAG2248</td>
<td valign="middle" align="center">487,823</td>
<td valign="middle" align="center">26,446</td>
<td valign="middle" align="center">200,674</td>
<td valign="middle" align="center">41.1</td>
<td valign="middle" align="center">420</td>
<td valign="middle" align="center">53,018</td>
<td valign="middle" align="center">10.9</td>
<td valign="middle" align="center">26,866</td>
<td valign="middle" align="center">253,692</td>
<td valign="middle" align="center">52.0</td>
</tr>
<tr>
<td valign="middle" align="center">SAG41.86</td>
<td valign="middle" align="center">488,313</td>
<td valign="middle" align="center">26,436</td>
<td valign="middle" align="center">201,245</td>
<td valign="middle" align="center">41.2</td>
<td valign="middle" align="center">421</td>
<td valign="middle" align="center">53,322</td>
<td valign="middle" align="center">10.9</td>
<td valign="middle" align="center">26,857</td>
<td valign="middle" align="center">254,567</td>
<td valign="middle" align="center">52.1</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Samples are arranged in order of increasing plastome size. Total length of dispersed repeats is the total number of base pair sites occupied by all dispersed repeats.</p></fn>
</table-wrap-foot>
</table-wrap>
<p>The four outliers in overall plastome size also had the four largest IR sizes (<xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>). Size of the IR was positively correlated with total plastome size when outliers were included (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4K</bold></xref>), but not when outliers were excluded (<xref ref-type="fig" rid="f4"><bold>Figure&#xa0;4L</bold></xref>). As for the entire plastome, non-coding DNA in the IR was positively correlated with IR size whether or not outliers were included (<xref ref-type="fig" rid="f4"><bold>Figures&#xa0;4M, N</bold></xref>).</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<label>4</label>
<title>Discussion</title>
<p>Comparative analyses of complete plastomes for 29 <italic>Coelastrum</italic> strains provide insight into their evolution. The plastomes exhibit a typical quadripartite structure, but vary in total size, non-coding region content, and IR length. This strain-level plastome dataset provides new insights into the structural, evolutionary, and phylogenetic diversity within <italic>Coelastrum</italic>.</p>
<p>We reiterate that we use the term &#x201c;nominal species&#x201d; to indicate that any classification is a hypothesis given the data at hand. Application of plastome data to Scenedesmaceae has thus far focused on higher level taxonomic relationships. Our application of plastome data to multiple strains of several <italic>Coelastrum</italic> nominal species speaks not only to higher level classification in the Scenedesmaceae but may also have revealed new evidence for cryptic species in <italic>Coelastrum</italic>.</p>
<sec id="s4_1">
<label>4.1</label>
<title>Plastome size variation and causes of expansion</title>
<p>Our study reveals an approximately 3.3-fold variation in plastome size within <italic>Coelastrum</italic>, ranging from 166,827 bp in <italic>C. pseudomicroporum</italic> (UTEX 1353) to 553,457 bp in <italic>C. morus</italic> (SAG 41.86). A nearly two-fold difference in plastome size was observed between strains nominally identified as <italic>C. morus</italic>, representing a striking case of intraspecific size variation in green algae. The two strains of <italic>C. morus</italic> (SAG 2248 and SAG 41.86) stand out with an unprecedented genome size exceeding 550 kb, making them the largest plastomes reported within the order Sphaeropleales. Until now, plastomes of this magnitude have only been described in the green algal orders Chlamydomonadales and Chaetopeltidales, in species such as <italic>Volvox carteri</italic>, <italic>Floydiella terrestris</italic>, <italic>Haematococcus lacustris</italic>, and <italic>H. pluvialis</italic> (<xref ref-type="bibr" rid="B48">Smith and Lee, 2009</xref>, <xref ref-type="bibr" rid="B49">2010</xref>; <xref ref-type="bibr" rid="B7">Brouard et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B3">Bauman et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B43">Ren et&#xa0;al., 2021</xref>). These species often share several features including high GC content, repetitive DNA, and extensive intergenic regions. Plastome inflation has been proposed to be caused by error-prone DNA repair or mutational hazard in non-coding regions and repeat-rich regions (<xref ref-type="bibr" rid="B48">Smith and Lee, 2009</xref>; <xref ref-type="bibr" rid="B7">Brouard et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B40">Mu&#xf1;oz-G&#xf3;mez et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B46">Smith, 2018</xref>, <xref ref-type="bibr" rid="B47">2020</xref>; <xref ref-type="bibr" rid="B43">Ren et&#xa0;al., 2021</xref>).</p>
<p>In contrast, the plastomes of all four outliers, including the two largest <italic>C. morus</italic> strains, present a unique evolutionary case. Despite their extreme size, these four outliers do not exhibit unusually high GC content (GC range&#xa0;=&#xa0;27.4&#x2013;30.5%), nor do they show the remarkable intron density found in red algal lineages such as <italic>Bulboplastis apyrenoidosa</italic> and <italic>Corynoplastis japonica</italic>, which possess over 200 and 300 introns, respectively (<xref ref-type="bibr" rid="B40">Mu&#xf1;oz-G&#xf3;mez et&#xa0;al., 2017</xref>). Instead, the two largest <italic>C. morus</italic> strains contain a modest 29 introns. Plastomes of the smaller outliers <italic>C. morus</italic> SAG 2078 and <italic>C. reticulatum</italic> UTEX 1365 contain only 23 and 19 introns, respectively. Taken together, these observations underscore that intron proliferation is not the main driver of non-coding region size and overall plastome enlargement in <italic>Coelastrum</italic>. This is particularly evident when the outliers are removed from the analysis, in which case we found no significant correlation between intron number or size and total plastome size.</p>
<p>Our findings suggest that genome expansion in <italic>Coelastrum</italic> is primarily driven by the accumulation of non-coding sequence, particularly through the expansion of intergenic regions, rather than increased gene content or intron load. This mirrors patterns observed in <italic>Haematococcus lacustris</italic>, where plastome inflation is attributed to intergenic expansion (<xref ref-type="bibr" rid="B46">Smith, 2018</xref>), and in <italic>B. apyrenoidosa</italic>, where enlarged intergenic regions are linked to insertion sequences of bacterial origin (<xref ref-type="bibr" rid="B40">Mu&#xf1;oz-G&#xf3;mez et&#xa0;al., 2017</xref>). Our BLAST search results of the expanded intergenic regions in <italic>C. morus</italic> yielded no significant matches, which may reflect limited genomic representation of closely related green algal taxa or potential bacterial donors in public databases.</p>
<p>In addition to intergenic expansion, repetitive DNA is a major driver of plastome enlargement. In the two largest <italic>C. morus</italic> plastomes, dispersed and tandem repeats exceed 250 kb, accounting for more than half of the total plastome length, whereas most <italic>Coelastrum</italic> plastomes contain only trace repeat content (&lt;1%), with only a single dispersed repeat in approximately half of the samples. The magnitude of this proliferation parallels <italic>Floydiella terrestris</italic>, whose plastome is composed of nearly 50% short repeats (<xref ref-type="bibr" rid="B7">Brouard et&#xa0;al., 2010</xref>), and the repeat-rich architecture of <italic>Haematococcus lacustris</italic>, dominated by palindromic and dispersed repeats (<xref ref-type="bibr" rid="B3">Bauman et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B46">Smith, 2018</xref>). Within <italic>Coelastrum</italic>, repeat content scales with plastome size: compact genomes harbor little repetitive DNA, whereas enlarged lineages show progressively greater accumulations, culminating in the repeat-rich <italic>C. morus</italic> (<xref ref-type="table" rid="T2"><bold>Table&#xa0;2</bold></xref>). This pattern highlights repeat proliferation as a significant contributor to genome expansion. Although the exact molecular mechanisms remain elusive, inefficient DNA repair pathways, such as break-induced replication or the accumulation of palindromic repeats, may underlie intergenic expansion in <italic>C. morus</italic> plastomes, as proposed in other green and red algal systems (<xref ref-type="bibr" rid="B40">Mu&#xf1;oz-G&#xf3;mez et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B47">Smith, 2020</xref>; <xref ref-type="bibr" rid="B43">Ren et&#xa0;al., 2021</xref>).</p>
<p>In summary, the pattern in <italic>Coelastrum</italic> aligns with previous findings in green algal lineages, where plastome enlargement has been attributed to the accumulation of non-coding DNA, repeats, IR, and introns (<xref ref-type="bibr" rid="B7">Brouard et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B40">Mu&#xf1;oz-G&#xf3;mez et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B55">Turmel et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B3">Bauman et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B10">Cremen et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B46">Smith, 2018</xref>, <xref ref-type="bibr" rid="B47">2020</xref>; <xref ref-type="bibr" rid="B43">Ren et&#xa0;al., 2021</xref>).</p>
<p>IR length ranged from 7,650 bp to 65,144 bp, contributing to differences in overall genome size. Multiple IR boundary shifts and gene duplications were observed, particularly involving <italic>psbC</italic>, <italic>atpF</italic>, <italic>atpH</italic>, and <italic>ftsH</italic>, indicating ongoing IR structural rearrangement. Patterns of IR boundary variation indicate that recently diverged lineages tend to exhibit more extensive IR expansions, reflected by the inclusion of additional genes into the IR (<xref ref-type="fig" rid="f2"><bold>Figure&#xa0;2</bold></xref>). These findings align with the dynamic nature of IR expansion and contraction previously described in other members of green algae (<xref ref-type="bibr" rid="B34">Lemieux et&#xa0;al., 2014</xref>; <xref ref-type="bibr" rid="B51">Turmel et&#xa0;al., 2016</xref>).</p>
<p><italic>Tetradesmus</italic> is the next most densely sampled Scenedesmaceae genus, with 13 strains (<xref ref-type="bibr" rid="B9">Cho and Lee, 2024</xref>). Total plastome size ranged from 148,816 to 196,309 bp. From this narrow perspective, the more than threefold range in total plastome size of <italic>Coelastrum</italic> is extraordinary, but we hope our findings will stimulate more detailed work on other Scenedesmaceae groups.</p>
</sec>
<sec id="s4_2">
<label>4.2</label>
<title>Intron dynamics</title>
<p>We focused our discussion on intron dynamics solely within <italic>Coelastrum</italic> because intron analysis has not been reported evenly across other Scenedesmaceae plastome studies. Nevertheless, <xref ref-type="bibr" rid="B61">Zhao et&#xa0;al. (2022)</xref> identified introns in seven single copy region genes, five of which also had introns in <italic>Coelastrum</italic>. The <italic>rrn23</italic> gene is the only <italic>Pectinodesmus</italic> IR gene with an intron; all <italic>Coelastrum</italic> strains have at least one intron in the same gene. <italic>Coelastrella</italic> has seven genes with introns, and all seven are shared with <italic>Coelastrum</italic> (<xref ref-type="bibr" rid="B58">Wang et&#xa0;al., 2019</xref>). <italic>Coccoidesmus</italic> was reported by <xref ref-type="bibr" rid="B57">Wang et&#xa0;al. (2024)</xref> to have introns in the large RNA subunit gene and in the <italic>psbZ</italic> gene. Introns were found in all of our large RNA subunit genes, but only in one <italic>psbZ</italic> gene (in our single strain of <italic>C. cambricum</italic> UTEX 2446, see <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Figure S2</bold></xref> and discussed below).</p>
<p>Intron diversity across the 29 <italic>Coelastrum</italic> plastomes revealed substantial lineage-specific variation in both presence and number, consistent with previous observations of dynamic intron evolution in Chlorophyta. Thirteen genes were identified as intron-bearing, with notable variability in <italic>psaA</italic>, <italic>psbA</italic>, <italic>psbC</italic>, <italic>rbcL</italic>, and <italic>rrn23</italic>. The distribution pattern largely mirrors those previously characterized in green algal plastomes, particularly in the order Sphaeropleales (<xref ref-type="bibr" rid="B18">Fu&#x10d;&#xed;kov&#xe1; et&#xa0;al., 2016</xref>; <xref ref-type="bibr" rid="B36">McManus et&#xa0;al., 2018</xref>). The <italic>psaA</italic> gene consistently exhibited a trans-spliced architecture, with three exons interrupted by two introns, a synapomorphy of Sphaeropleales. This trans-splicing configuration is conserved across all <italic>Coelastrum</italic> strains sampled here. The cis-spliced configuration C1190 was absent in <italic>C. microporum</italic> (CG1) and the clade of <italic>C. reticulatum</italic> + <italic>C. morus</italic>. Within <italic>Coelastrum</italic>, this is most parsimoniously interpreted as parallel losses. The cis-spliced configuration is widely scattered across the Scenedesmaceae and certain <italic>Pediastrum</italic> species within the sister family Hydrodictyaceae (<xref ref-type="bibr" rid="B36">McManus et&#xa0;al., 2018</xref>), and we hesitate, without increased taxon sampling, to conclude whether this intron presence represents parallel gains across the Sphaeropleales, whether its absence represents parallel losses, or some more complex process.</p>
<p>With the caveat that taxon sampling and reporting of intron data are still uneven in the Scenedesmaceae, it does appear that several introns may be lineage-specific or represent recent insertion events. For instance, introns in <italic>psbE</italic> (position 66) and <italic>psbZ</italic> (position 65) were restricted to <italic>C. morus</italic> (SAG 2248 and SAG 41.86) and <italic>C. cambricum</italic> (UTEX 2446), respectively. As far as we are aware, there are no previous reports of introns in <italic>psbE</italic> in any green algae. Similarly, the <italic>atpA</italic> intron (position 489) was restricted to a clade within <italic>C. astroideum</italic> strains and to one <italic>C. microporum</italic> strain (UTEX 281). This intron is shared with the distantly related <italic>Neochloris aquatica</italic>, suggesting either deep homology or a horizontal transfer event (<xref ref-type="bibr" rid="B36">McManus et&#xa0;al., 2018</xref>). The group I intron in <italic>trnL-UAA</italic> was universally conserved across all <italic>Coelastrum</italic> plastomes. This intron has been reported as a vertically inherited feature across photosynthetic eukaryotes, from red algae to land plants (<xref ref-type="bibr" rid="B6">Besendahl et&#xa0;al., 2000</xref>), and its universal presence here further supports its evolutionary stability within the Chlorophyta.</p>
<p>A striking pattern of intron proliferation was observed in the <italic>psbA</italic> gene of <italic>C. morus</italic>. Strains SAG 2078, SAG 2248, and SAG 41.86 contained up to seven introns at unique insertion positions (81, 174, 273, 393, 486, 533, 741, 885), far exceeding the typical intron number (&#x2264;4) reported in <italic>Scenedesmus obliquus</italic> (<xref ref-type="bibr" rid="B11">de Cambiaire et&#xa0;al., 2006</xref>) and species within the sister family Hydrodictyaceae (<xref ref-type="bibr" rid="B36">McManus et&#xa0;al., 2018</xref>). This lineage-specific intron expansion suggests recent and rapid intron gain events.</p>
</sec>
<sec id="s4_3">
<label>4.3</label>
<title>Gene loss events</title>
<p>Most <italic>Coelastrum</italic> plastomes retain a conserved gene complement consistent with other Scenedesmaceae. However, <italic>C. reticulatum</italic> (UTEX 1365) exhibits a unique gene loss cluster affecting five adjacent protein-coding genes (<italic>clpP</italic>, <italic>rpl2</italic>, <italic>rpl23</italic>, <italic>rps4</italic>, <italic>rps19</italic>) within the SSC region, along with tRNA genes <italic>trnF</italic>-GAA and <italic>trnL</italic>-TAG. Similar clustered gene loss events have been reported in other green algae and are thought to reflect localized rearrangements, deletions, or functional transfers to the nucleus (<xref ref-type="bibr" rid="B7">Brouard et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B53">Turmel and Lemieux, 2018</xref>). Additional tRNA gene losses in <italic>C. reticulatum</italic> (SAG 8.81), <italic>C. proboscideum</italic> (UTEX 282), and outgroups such as <italic>Pectinodesmus pectinatus</italic> suggest that tRNA genes are particularly prone to loss or replacement. The gene <italic>clpP</italic> encodes a subunit of the chloroplast Clp protease, while <italic>rpl2, rpl23, rps4</italic>, and <italic>rps19</italic> encode ribosomal protein subunits, suggesting that the loss of these genes may affect plastid protease or ribosome function. Transcriptomic analysis/nuclear genome sequencing needs to be conducted to confirm loss or transfer of these genes to the nucleus.</p>
</sec>
<sec id="s4_4">
<label>4.4</label>
<title>Phylogenetic implications</title>
<p>Our recovery of <italic>Coelastrum</italic> as monophyletic highlights issues of both gene and taxon sampling in interpreting the phylogeny of the Scenedesmaceae. It is beyond the scope of this paper to resolve issues related to these problems, but we focus on two papers that clearly highlight them.</p>
<p><xref ref-type="bibr" rid="B22">Hegewald et&#xa0;al. (2010)</xref> used a relatively short sequence (ITS2). Nevertheless, we consider this to be a fundamental study because of its breadth of taxon sampling, including 106 Scenedesmaceae strains from eleven nominal genera. In contrast to our results, they recovered a non-monophyletic <italic>Coelastrum</italic>. Two strains are of particular interest: we selected them for analysis because they occupied critical positions in the <xref ref-type="bibr" rid="B22">Hegewald et&#xa0;al. (2010)</xref> tree. Namely, our study and <xref ref-type="bibr" rid="B22">Hegewald et&#xa0;al. (2010)</xref> included SAG 2078 (<italic>C. morus</italic>) and SAG 8.81 (<italic>H. reticulata</italic> Dangeard = <italic>C. reticulatum</italic> (Dangeard) Senn). If one were to trim away strains unique to only one study or the other, <italic>C. reticulatum</italic> SAG 8.81 would be sister to <italic>C. morus</italic> SAG 2078 in both studies. However, differences in taxon sampling exist, and one cannot ignore that <xref ref-type="bibr" rid="B22">Hegewald et&#xa0;al. (2010)</xref> also recovered <italic>Coelastrella</italic> spec. SAG 217.5 (isolated from Finland), <italic>Dimorphococcus lunatus</italic> SAG 2241, and <italic>Asterarcys quadricellulare</italic> COMAS 1977&#x2013;75 as close relatives to both SAG 8.81 and <italic>Coelastrum cambricum</italic> SAG 7.81. The latter strain was not available at the time we assembled cultures and data for analysis, so we used <italic>C. cambricum</italic> UTEX 2446. ITS2 data provided only weak support at the node linking <italic>Coelastrella</italic> spec. SAG 217.5 to other taxa, whereas plastome data, using the already published <italic>Coelastrella saipanensis</italic> sequence (NC042181), placed that <italic>Coelastrella</italic> strain in a position distant from all three of our <italic>C. reticulatum</italic> strains, including SAG 8.81. 
It is possible that <italic>Coelastrella saipanensis</italic> (NC042181) and <italic>Coelastrella</italic> spec. SAG 217.5 belong to different lineages, and/or that other taxon sampling differences influenced the relationship of <italic>Coelastrella</italic> to <italic>Coelastrum</italic>. We also note that the deeper nodes of the <italic>Coelastrum sensu lato</italic> branch had very low BS support in <xref ref-type="bibr" rid="B22">Hegewald et&#xa0;al. (2010)</xref>, indicating that differences between their tree and ours may also be due to gene sampling and low resolving power of the ITS2 at critical nodes.</p>
<p>A much more recent paper used multiple longer sequences in three independent analyses, and again illustrated that both gene and strain sampling affect tree topologies. <xref ref-type="bibr" rid="B57">Wang et&#xa0;al. (2024)</xref> analyzed nuclear ITS data (referred to only as the &#x201c;ITS region&#x201d; in that study), the nuclear SSU (18S), and the plastome gene <italic>tufA</italic> independently of one another, each with a similar but not identical taxon sampling design. <italic>Coelastrum</italic> was recovered as monophyletic with 18S data, but the only two species included were <italic>C. proboscideum</italic> (SAG 217-3) and <italic>C. sphaericum</italic> (SAG 217-2). <italic>Hariotina reticulata</italic> (SAG 8.81) was embedded in a monophyletic <italic>Hariotina</italic> and that genus was several nodes away from <italic>Coelastrum</italic>. However, neither genus was monophyletic when ITS data were analyzed, and different <italic>Coelastrum</italic> strains (<italic>C. astroideum</italic> var. <italic>rugosum</italic> RW10 and <italic>C. microporum</italic> FNY-1) were employed. Finally, with <italic>tufA</italic> data, and using a third pair of <italic>Coelastrum</italic> (<italic>C. sphaericum</italic> CCMA UFSCar 060, and <italic>C.</italic> sp. YN 15-2), a monophyletic <italic>Coelastrum</italic> was recovered as sister to a monophyletic <italic>Hariotina</italic>.</p>
<p>We are not criticizing <xref ref-type="bibr" rid="B57">Wang et&#xa0;al. (2024)</xref>, as they used sequences available in NCBI, and they discussed several points of incongruence. We only use <xref ref-type="bibr" rid="B22">Hegewald et&#xa0;al. (2010)</xref> and <xref ref-type="bibr" rid="B57">Wang et&#xa0;al. (2024)</xref> to illustrate that molecular phylogenetic studies need to account for strain and taxon sampling as well as gene sampling when discussing classification. Finally, we note that the SSU and ITS data are from one compartment (nuclear genome) and the <italic>tufA</italic> data are from another (the plastome). The possibility of distinct gene trees and organismal trees must be considered as well when attempting to corroborate or reject monophyly for <italic>Coelastrum</italic>.</p>
<p>In summary, future studies of classification using phylogenomic data obviously need to include both more outgroup and ingroup taxa, and more strain representatives for each species, to conclusively support or reject <italic>Coelastrum</italic> as monophyletic.</p>
<p>Looking towards lower-level classifications, towards the tips of the plastome tree, there is general agreement between species names and plastome genetic diversity. Plastome data also recovered hierarchical structure within nominal species. Discovery of additional diversity within a historical morphological classification at the species level by the use of DNA sequence data often leads to the invocation of &#x201c;cryptic species&#x201d;, but morphology in algae is usually treated in some sort of non-canonical fashion, whereas molecular data are treated phylogenetically (<xref ref-type="bibr" rid="B2">Alverson, 2008</xref>).</p>
<p>The phylogenetic species concept demands only that a species be the smallest monophyletic group that a systematist cares to name. That is, grouping is objective, but naming is arbitrary (<xref ref-type="bibr" rid="B17">Frost and Kluge, 1994</xref>; <xref ref-type="bibr" rid="B2">Alverson, 2008</xref>; <xref ref-type="bibr" rid="B38">Mishler and Theriot, 2000</xref>). Multiple strains of each of <italic>C. morus</italic>, <italic>C. reticulatum</italic>, <italic>C. astroideum</italic>, and <italic>C. pseudomicroporum</italic> are each supported as monophyletic with BS support of 100%.</p>
<p>However, phylogenetic structure was recovered within each of these clades, with plastome size and sequence contributing to diversity in all four clades (<xref ref-type="fig" rid="f1"><bold>Figure&#xa0;1</bold></xref> and <xref ref-type="table" rid="T1"><bold>Table&#xa0;1</bold></xref>). The clade of <italic>C. morus</italic> strains recovered two (SAG 2248 and SAG 41.86) with plastomes of over 500 kb and a third (SAG 2078) whose genome was almost 300 kb (compared to a median of about 180 kb). The two largest plastomes could represent one phylogenetic species and SAG 2078 could possibly represent a second. Similarly, there was one strain of <italic>C. reticulatum</italic> (UTEX 1365) with a plastome nearly 40 kb larger than that of <italic>C. reticulatum</italic> CG10, and nearly 48 kb larger than that of <italic>C. reticulatum</italic> SAG 8.81. <italic>Coelastrum astroideum</italic> is represented by at least two distinct clades each receiving 100% BS support (strains CG6 and CW1; strains CS1, CS3, CS9, and SAG 33.88). The former two strains had nearly identical sequences, and also the largest plastomes among nominal <italic>C. astroideum</italic>, differing in length by only 56 bases between the two. However, the Swan Lake strains (CS1, CS3, and CS9) differed by about 3 kb, and SAG 33.88 was another 2 kb larger than the largest Swan Lake strain (6 kb smaller than the CG6 and CW1 strains). Plastomes of <italic>C. pseudomicroporum</italic> were recovered in two subclades (CLB and UTEX 1353; SAG 2077 and UTEX 280). Sister strains UTEX 1353 and CLB had the smallest and largest plastomes of <italic>C. pseudomicroporum</italic>, differing in size by nearly 13 kb.</p>
<p>Plastome size differences within these <italic>Coelastrum</italic> clades ranged from 100 bp differences to several hundred thousand bp differences. The biological meaning is unclear and there are no clear guidelines to be taken from the general literature on Viridiplantae plastome size and species diagnosis. For example, in vascular plants, species of pears are known to interbreed when plastome sizes differ in terms of only a few hundred bases (<xref ref-type="bibr" rid="B28">Kim et&#xa0;al., 2024</xref>). On the other hand, differences in plastome size of as much as 20 kb are considered intraspecific in the widely cultivated <italic>Peucedanum japonicum</italic> (<xref ref-type="bibr" rid="B25">Joh et&#xa0;al., 2025</xref>). We are confident that increasing strain sampling in green microalgae will find other such perplexing and interesting observations.</p>
<p>The non-monophyly of <italic>C. microporum</italic> strains presents a different set of issues. There are three distinct lineages. One strain (UTEX 281) is embedded within a clade that includes <italic>C. indicum</italic> (SAG 2363) and <italic>C. cambricum</italic> (UTEX 2446), while CF1 and SAG 2292 form a clade of strains with nearly identical sequences, as do CS5, CW5 and UTEX 1354. Again, we observe variation among nominal strains of <italic>C. microporum</italic> of as much as 20 kb. These inconsistencies may reflect simple taxonomic misidentification, incomplete lineage sorting, and/or historical hybridization events.</p>
<p>Two species mentioned several times in various studies are particularly in need of revision and probably need to be considered synonymous. <italic>Coelastrum sphaericum</italic> and <italic>C. proboscideum</italic> have been difficult to resolve both with morphology and genetic data. <xref ref-type="bibr" rid="B29">Kom&#xe1;rek and Fott (1983)</xref> claimed that these species differ in apical structure, with the former being formed by small bumps, and the latter representing a crown-like structure. Others have considered the two species synonymous (<xref ref-type="bibr" rid="B20">Hajdu et&#xa0;al., 1976</xref>). Our results are consistent with the findings of <xref ref-type="bibr" rid="B22">Hegewald et&#xa0;al. (2010)</xref>, who suggested a persistent phylogenetic signal despite differences in molecular markers used (e.g., nuclear ITS). Such a signal, interpreted as shared apomorphic similarity in morphology and DNA sequence, strongly supports the classification of <italic>C. sphaericum</italic> and <italic>C. proboscideum</italic> as a single phylogenetic species. We note again, however, that the largest plastome is more than 4 kb larger than the smallest. Thus, such inferences will be more powerful once broader strain sampling is done across both data sets.</p>
<p>In summary, phylogenetic resolution may be constrained by limited taxon sampling (<xref ref-type="bibr" rid="B23">Hillis, 1998</xref>; <xref ref-type="bibr" rid="B42">Pollock et&#xa0;al., 2002</xref>; <xref ref-type="bibr" rid="B63">Zwickl and Hillis, 2002</xref>; <xref ref-type="bibr" rid="B21">Heath et&#xa0;al., 2008</xref>), especially in cases where only a single strain represents a species. In such instances, intraspecific variability remains unassessed, which may mask deeper population structure or contribute to apparent paraphyly. Finding strains that are very similar in coding region sequence, with shared morphological characteristics, but very different plastome sizes, in all of our clades underscores the need to expand strain sampling across multiple populations per species to better understand species classification and diagnosis in these green algae.</p>
</sec>
</sec>
<sec id="s5" sec-type="conclusions">
<label>5</label>
<title>Conclusion</title>
<p>This study presents the most comprehensive species and strain-level analysis of plastid genome evolution in <italic>Coelastrum</italic>, a morphologically diverse and ecologically important genus within the Scenedesmaceae. We demonstrate that plastome size variation in <italic>Coelastrum</italic> is primarily explained by the expansion of intergenic regions and accumulation of repetitive DNA, with additional contributions from variation in IR length and, in some cases, intron content. While most plastomes retain a conserved gene complement, lineage-specific gene loss and intron dynamics highlight the ongoing evolutionary plasticity of these organellar genomes. We observed an almost twofold difference in plastome size among strains of the same nominal species, <italic>C. morus</italic>. There was a less impressive but still large difference in plastome size among lineages in <italic>C. reticulatum</italic> (that of UTEX 1365 was 16% larger than the other two strains).</p>
<p>The plastome-based phylogeny reveals well-resolved relationships among species and supports the utility of plastome data for refining taxonomic classification in green algae. These findings contribute to our understanding of structural genome evolution in Chlorophyta and underscore the importance of expanding sampling at the species and strain levels in plastome studies.</p>
<p>Future work integrating nuclear and mitochondrial genomes, along with ecological data, will help resolve the evolutionary forces shaping organelle genome architecture in <italic>Coelastrum</italic> and other green algal lineages. Although classification was not the focus of our study, our plastome analysis also identified areas of congruence and incongruence between morphology and molecular markers, which bear further study.</p>
</sec>
</body>
<back>
<sec id="s6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: <uri xlink:href="https://figshare.com/articles/dataset/Complete_annotated_chloroplast_genome_sequences_of_29_i_Coelastrum_i_strains_Sphaeropleales_Chlorophyta_/30482909">https://figshare.com/articles/dataset/Complete_annotated_chloroplast_genome_sequences_of_29_i_Coelastrum_i_strains_Sphaeropleales_Chlorophyta_/30482909</uri></p></sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>CL: Methodology, Formal analysis, Writing &#x2013; review &amp; editing, Writing &#x2013; original draft, Data curation, Visualization, Conceptualization. RJ: Supervision, Writing &#x2013; review &amp; editing. ET: Conceptualization, Project administration, Writing &#x2013; review &amp; editing, Funding acquisition, Supervision, Resources.</p></sec>
<ack>
<title>Acknowledgments</title>
<p>The authors thank Chaehee Lee for assistance in data analysis, and Joshua Cooper and Francesca Moroni for assistance in bioinformatics. Michelle Mikesh was of great help in preparing specimens for SEM. Elena Litchman and Allyson Hutchens provided invaluable logistical support to collect and isolate <italic>Coelastrum</italic> spp. from the state of Michigan (USA) used in this study.</p>
</ack>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The author(s) declared that this work was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
<sec id="s10" sec-type="ai-statement">
<title>Generative AI statement</title>
<p>The author(s) declared that generative AI was not used in the creation of this manuscript.</p>
<p>Any alternative text (alt text) provided alongside figures in this article has been generated by Frontiers with the support of artificial intelligence and reasonable efforts have been made to ensure accuracy, including review by the authors wherever possible. If you identify any issues, please contact us.</p></sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p></sec>
<sec id="s12" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2026.1736783/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2026.1736783/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="DataSheet1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Altschul</surname> <given-names>S. F.</given-names></name>
<name><surname>Gish</surname> <given-names>W.</given-names></name>
<name><surname>Miller</surname> <given-names>W.</given-names></name>
<name><surname>Myers</surname> <given-names>E. W.</given-names></name>
<name><surname>Lipman</surname> <given-names>D. J.</given-names></name>
</person-group> (<year>1990</year>). 
<article-title>Basic local alignment search tool</article-title>. <source>J. Mol. Biol.</source> <volume>215</volume>, <fpage>403</fpage>&#x2013;<lpage>410</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/S0022-2836(05)80360-2</pub-id>, PMID: <pub-id pub-id-type="pmid">2231712</pub-id>
</mixed-citation>
</ref>
<ref id="B2">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Alverson</surname> <given-names>A. J.</given-names></name>
</person-group> (<year>2008</year>). 
<article-title>Molecular systematics and the diatom species</article-title>. <source>Protist</source> <volume>159</volume>, <fpage>339</fpage>&#x2013;<lpage>353</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.protis.2008.04.001</pub-id>, PMID: <pub-id pub-id-type="pmid">18539524</pub-id>
</mixed-citation>
</ref>
<ref id="B3">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bauman</surname> <given-names>N.</given-names></name>
<name><surname>Akella</surname> <given-names>S.</given-names></name>
<name><surname>Hann</surname> <given-names>E.</given-names></name>
<name><surname>Morey</surname> <given-names>R.</given-names></name>
<name><surname>Schwartz</surname> <given-names>A. S.</given-names></name>
<name><surname>Brown</surname> <given-names>R.</given-names></name>
<etal/>
</person-group>. (<year>2018</year>). 
<article-title>Next-generation sequencing of Haematococcus lacustris reveals an extremely large 1.35-megabase chloroplast genome</article-title>. <source>Genome Announc.</source> <volume>6</volume>, <fpage>e00181</fpage>&#x2013;<lpage>e00118</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/genomeA.00181-18</pub-id>, PMID: <pub-id pub-id-type="pmid">29567741</pub-id>
</mixed-citation>
</ref>
<ref id="B4">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>B&#xe9;langer</surname> <given-names>A.-S.</given-names></name>
<name><surname>Brouard</surname> <given-names>J.-S.</given-names></name>
<name><surname>Charlebois</surname> <given-names>P.</given-names></name>
<name><surname>Otis</surname> <given-names>C.</given-names></name>
<name><surname>Lemieux</surname> <given-names>C.</given-names></name>
<name><surname>Turmel</surname> <given-names>M.</given-names></name>
</person-group> (<year>2006</year>). 
<article-title>Distinctive architecture of the chloroplast genome in the chlorophycean green alga Stigeoclonium helveticum</article-title>. <source>Mol. Genet. Genomics MGG</source> <volume>276</volume>, <fpage>464</fpage>&#x2013;<lpage>477</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00438-006-0156-2</pub-id>, PMID: <pub-id pub-id-type="pmid">16944205</pub-id>
</mixed-citation>
</ref>
<ref id="B5">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Benson</surname> <given-names>G.</given-names></name>
</person-group> (<year>1999</year>). 
<article-title>Tandem repeats finder: a program to analyze DNA sequences</article-title>. <source>Nucleic Acids Res.</source> <volume>27</volume>, <fpage>573</fpage>&#x2013;<lpage>580</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/27.2.573</pub-id>, PMID: <pub-id pub-id-type="pmid">9862982</pub-id>
</mixed-citation>
</ref>
<ref id="B6">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Besendahl</surname> <given-names>A.</given-names></name>
<name><surname>Qiu</surname> <given-names>Y. L.</given-names></name>
<name><surname>Lee</surname> <given-names>J.</given-names></name>
<name><surname>Palmer</surname> <given-names>J. D.</given-names></name>
<name><surname>Bhattacharya</surname> <given-names>D.</given-names></name>
</person-group> (<year>2000</year>). 
<article-title>The cyanobacterial origin and vertical transmission of the plastid tRNA(Leu) group-I intron</article-title>. <source>Curr. Genet.</source> <volume>37</volume>, <fpage>12</fpage>&#x2013;<lpage>23</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s002940050002</pub-id>, PMID: <pub-id pub-id-type="pmid">10672439</pub-id>
</mixed-citation>
</ref>
<ref id="B7">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Brouard</surname> <given-names>J.-S.</given-names></name>
<name><surname>Otis</surname> <given-names>C.</given-names></name>
<name><surname>Lemieux</surname> <given-names>C.</given-names></name>
<name><surname>Turmel</surname> <given-names>M.</given-names></name>
</person-group> (<year>2010</year>). 
<article-title>The exceptionally large chloroplast genome of the green alga Floydiella terrestris illuminates the evolutionary history of the Chlorophyceae</article-title>. <source>Genome Biol. Evol.</source> <volume>2</volume>, <fpage>240</fpage>&#x2013;<lpage>256</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gbe/evq014</pub-id>, PMID: <pub-id pub-id-type="pmid">20624729</pub-id>
</mixed-citation>
</ref>
<ref id="B8">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Bushnell</surname> <given-names>B</given-names></name>
</person-group>. (<year>2014</year>). 
<article-title>BBMap: A fast, accurate, splice-aware aligner. Lawrence Berkeley National Laboratory</article-title>. <source>LBNL Report #: LBNL-7065E</source>. Available online at: <uri xlink:href="https://escholarship.org/uc/item/1h3515gn">https://escholarship.org/uc/item/1h3515gn</uri>
</mixed-citation>
</ref>
<ref id="B9">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cho</surname> <given-names>H. S.</given-names></name>
<name><surname>Lee</surname> <given-names>J.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Taxonomic reinvestigation of the genus Tetradesmus (Scenedesmaceae; Sphaeropleales) based on morphological characteristics and chloroplast genomes</article-title>. <source>Front. Plant Sci.</source> <volume>15</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fpls.2024.1303175</pub-id>, PMID: <pub-id pub-id-type="pmid">38419779</pub-id>
</mixed-citation>
</ref>
<ref id="B10">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Cremen</surname> <given-names>M. C. M.</given-names></name>
<name><surname>Leliaert</surname> <given-names>F.</given-names></name>
<name><surname>Marcelino</surname> <given-names>V. R.</given-names></name>
<name><surname>Verbruggen</surname> <given-names>H.</given-names></name>
</person-group> (<year>2018</year>). 
<article-title>Large diversity of nonstandard genes and dynamic evolution of chloroplast genomes in siphonous green algae (Bryopsidales, Chlorophyta)</article-title>. <source>Genome Biol. Evol.</source> <volume>10</volume>, <fpage>1048</fpage>&#x2013;<lpage>1061</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gbe/evy063</pub-id>, PMID: <pub-id pub-id-type="pmid">29635329</pub-id>
</mixed-citation>
</ref>
<ref id="B11">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>de Cambiaire</surname> <given-names>J.-C.</given-names></name>
<name><surname>Otis</surname> <given-names>C.</given-names></name>
<name><surname>Lemieux</surname> <given-names>C.</given-names></name>
<name><surname>Turmel</surname> <given-names>M.</given-names></name>
</person-group> (<year>2006</year>). 
<article-title>The complete chloroplast genome sequence of the chlorophycean green alga Scenedesmus obliquus reveals a compact gene organization and a biased distribution of genes on the two DNA strands</article-title>. <source>BMC Evol. Biol.</source> <volume>6</volume>, <elocation-id>37</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2148-6-37</pub-id>, PMID: <pub-id pub-id-type="pmid">16638149</pub-id>
</mixed-citation>
</ref>
<ref id="B12">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>de Cambiaire</surname> <given-names>J.-C.</given-names></name>
<name><surname>Otis</surname> <given-names>C.</given-names></name>
<name><surname>Turmel</surname> <given-names>M.</given-names></name>
<name><surname>Lemieux</surname> <given-names>C.</given-names></name>
</person-group> (<year>2007</year>). 
<article-title>The chloroplast genome sequence of the green alga Leptosira terrestris: multiple losses of the inverted repeat and extensive genome rearrangements within the Trebouxiophyceae</article-title>. <source>BMC Genomics</source> <volume>8</volume>, <elocation-id>213</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2164-8-213</pub-id>, PMID: <pub-id pub-id-type="pmid">17610731</pub-id>
</mixed-citation>
</ref>
<ref id="B13">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Dierckxsens</surname> <given-names>N.</given-names></name>
<name><surname>Mardulyn</surname> <given-names>P.</given-names></name>
<name><surname>Smits</surname> <given-names>G.</given-names></name>
</person-group> (<year>2017</year>). 
<article-title>NOVOPlasty: <italic>de novo</italic> assembly of organelle genomes from whole genome data</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume>, <elocation-id>e18</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkw955</pub-id>, PMID: <pub-id pub-id-type="pmid">28204566</pub-id>
</mixed-citation>
</ref>
<ref id="B14">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Douchi</surname> <given-names>D.</given-names></name>
<name><surname>Mosey</surname> <given-names>M.</given-names></name>
<name><surname>Astling</surname> <given-names>D. P.</given-names></name>
<name><surname>Knoshaug</surname> <given-names>E. P.</given-names></name>
<name><surname>Nag</surname> <given-names>A.</given-names></name>
<name><surname>McGowen</surname> <given-names>J.</given-names></name>
<etal/>
</person-group>. (<year>2021</year>). 
<article-title>Nuclear and chloroplast genome engineering of a productive non-model alga <italic>Desmodesmus armatus</italic>: Insights into unusual and selective acquisition mechanisms for foreign DNA</article-title>. <source>Algal Res.</source> <volume>53</volume>, <elocation-id>102152</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.algal.2020.102152</pub-id>
</mixed-citation>
</ref>
<ref id="B15">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Fenwick</surname> <given-names>M. G.</given-names></name>
</person-group> (<year>1968</year>). 
<article-title>Review of the status of some green algae in the genus Coelastrum</article-title>. <source>Mich. Bot.</source> <volume>7</volume>, <fpage>129</fpage>&#x2013;<lpage>131</lpage>.
</mixed-citation>
</ref>
<ref id="B16">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Fenwick</surname> <given-names>M. G.</given-names></name>
<name><surname>Hansen</surname> <given-names>L. O.</given-names></name>
<name><surname>Lynch</surname> <given-names>D. L.</given-names></name>
</person-group> (<year>1966</year>). 
<article-title>Polymorphic forms of Coelastrum proboscideum Bohn</article-title>. <source>Trans. Am. Microsc. Soc.</source> <volume>85</volume>, <fpage>579</fpage>&#x2013;<lpage>581</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2307/3224488</pub-id>
</mixed-citation>
</ref>
<ref id="B17">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Frost</surname> <given-names>D. R.</given-names></name>
<name><surname>Kluge</surname> <given-names>A. G.</given-names></name>
</person-group> (<year>1994</year>). 
<article-title>A consideration of epistemology in systematic biology, with special reference to species</article-title>. <source>Cladistics</source> <volume>10</volume>, <fpage>259</fpage>&#x2013;<lpage>294</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1006/clad.1994.1018</pub-id>
</mixed-citation>
</ref>
<ref id="B18">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Fu&#x10d;&#xed;kov&#xe1;</surname> <given-names>K.</given-names></name>
<name><surname>Lewis</surname> <given-names>L. A.</given-names></name>
<name><surname>Lewis</surname> <given-names>P. O.</given-names></name>
</person-group> (<year>2016</year>). 
<article-title>Comparative analyses of chloroplast genome data representing nine green algae in Sphaeropleales (Chlorophyceae, Chlorophyta)</article-title>. <source>Data Brief</source> <volume>7</volume>, <fpage>558</fpage>&#x2013;<lpage>570</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.dib.2016.03.014</pub-id>, PMID: <pub-id pub-id-type="pmid">27054159</pub-id>
</mixed-citation>
</ref>
<ref id="B19">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Guillard</surname> <given-names>R. R. L.</given-names></name>
</person-group> (<year>1975</year>). &#x201c;
<article-title>Culture of phytoplankton for feeding marine invertebrates</article-title>,&#x201d; in <source>Culture of Marine Invertebrate Animals: Proceedings &#x2014; 1st Conference on Culture of Marine Invertebrate Animals Greenport</source>. Eds. 
<person-group person-group-type="editor">
<name><surname>Smith</surname> <given-names>W. L.</given-names></name>
<name><surname>Chanley</surname> <given-names>M. H.</given-names></name>
</person-group> (
<publisher-name>Springer US</publisher-name>, <publisher-loc>Boston, MA</publisher-loc>), <fpage>29</fpage>&#x2013;<lpage>60</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-1-4615-8714-9_3</pub-id>
</mixed-citation>
</ref>
<ref id="B20">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hajdu</surname> <given-names>L.</given-names></name>
<name><surname>Hegewald</surname> <given-names>E.</given-names></name>
<name><surname>Cronberg</surname> <given-names>G.</given-names></name>
</person-group> (<year>1976</year>). 
<article-title>Beitr&#xe4;ge zur Taxonomie der Gattung <italic>Coelastrum</italic> (Chlorophyta, Chlorococcales)</article-title>. <source>Ann. Hist. Nat. Musei Natl. Hung.</source> <volume>68</volume>, <fpage>31</fpage>&#x2013;<lpage>38</lpage>.
</mixed-citation>
</ref>
<ref id="B21">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Heath</surname> <given-names>T. A.</given-names></name>
<name><surname>Hedtke</surname> <given-names>S. M.</given-names></name>
<name><surname>Hillis</surname> <given-names>D. M.</given-names></name>
</person-group> (<year>2008</year>). 
<article-title>Taxon sampling and the accuracy of phylogenetic analyses</article-title>. <source>J. Syst. Evol.</source> <volume>46</volume>, <fpage>239</fpage>&#x2013;<lpage>257</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3724/SP.J.1002.2008.08016</pub-id>
</mixed-citation>
</ref>
<ref id="B22">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hegewald</surname> <given-names>E.</given-names></name>
<name><surname>Wolf</surname> <given-names>M.</given-names></name>
<name><surname>Keller</surname> <given-names>A.</given-names></name>
<name><surname>Friedl</surname> <given-names>T.</given-names></name>
<name><surname>Krienitz</surname> <given-names>L.</given-names></name>
</person-group> (<year>2010</year>). 
<article-title>ITS2 sequence-structure phylogeny in the Scenedesmaceae with special reference to <italic>Coelastrum</italic> (Chlorophyta, Chlorophyceae), including the new genera <italic>Comasiella</italic> and <italic>Pectinodesmus</italic></article-title>. <source>Phycologia</source> <volume>49</volume>, <fpage>325</fpage>&#x2013;<lpage>335</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2216/09-61.1</pub-id>
</mixed-citation>
</ref>
<ref id="B23">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Hillis</surname> <given-names>D. M.</given-names></name>
</person-group> (<year>1998</year>). 
<article-title>Taxonomic sampling, phylogenetic accuracy, and investigator bias</article-title>. <source>Syst. Biol.</source> <volume>47</volume>, <fpage>3</fpage>&#x2013;<lpage>8</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/106351598260987</pub-id>, PMID: <pub-id pub-id-type="pmid">12064238</pub-id>
</mixed-citation>
</ref>
<ref id="B24">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Jansen</surname> <given-names>R. K.</given-names></name>
<name><surname>Ruhlman</surname> <given-names>T. A.</given-names></name>
</person-group> (<year>2012</year>). &#x201c;
<article-title>Plastid genomes of seed plants</article-title>,&#x201d; in <source>Genomics of Chloroplasts and Mitochondria</source>. Eds. 
<person-group person-group-type="editor">
<name><surname>Bock</surname> <given-names>R.</given-names></name>
<name><surname>Knoop</surname> <given-names>V.</given-names></name>
</person-group> (
<publisher-name>Springer Netherlands</publisher-name>, <publisher-loc>Dordrecht</publisher-loc>), <fpage>103</fpage>&#x2013;<lpage>126</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-94-007-2920-9_5</pub-id>
</mixed-citation>
</ref>
<ref id="B25">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Joh</surname> <given-names>H. J.</given-names></name>
<name><surname>Park</surname> <given-names>Y. S.</given-names></name>
<name><surname>Kang</surname> <given-names>J.-S.</given-names></name>
<name><surname>Kim</surname> <given-names>J. T.</given-names></name>
<name><surname>Lado</surname> <given-names>J. P.</given-names></name>
<name><surname>Han</surname> <given-names>S. I.</given-names></name>
<etal/>
</person-group>. (<year>2025</year>). 
<article-title>A recent large-scale intraspecific IR expansion and evolutionary dynamics of the plastome of <italic>Peucedanum japonicum</italic></article-title>. <source>Sci. Rep.</source> <volume>15</volume>, <fpage>104</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-024-84540-8</pub-id>, PMID: <pub-id pub-id-type="pmid">39748098</pub-id>
</mixed-citation>
</ref>
<ref id="B26">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kalyaanamoorthy</surname> <given-names>S.</given-names></name>
<name><surname>Minh</surname> <given-names>B. Q.</given-names></name>
<name><surname>Wong</surname> <given-names>T. K. F.</given-names></name>
<name><surname>von Haeseler</surname> <given-names>A.</given-names></name>
<name><surname>Jermiin</surname> <given-names>L. S.</given-names></name>
</person-group> (<year>2017</year>). 
<article-title>ModelFinder: fast model selection for accurate phylogenetic estimates</article-title>. <source>Nat. Methods</source> <volume>14</volume>, <fpage>587</fpage>&#x2013;<lpage>589</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nmeth.4285</pub-id>, PMID: <pub-id pub-id-type="pmid">28481363</pub-id>
</mixed-citation>
</ref>
<ref id="B27">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Katoh</surname> <given-names>K.</given-names></name>
<name><surname>Standley</surname> <given-names>D. M.</given-names></name>
</person-group> (<year>2013</year>). 
<article-title>MAFFT multiple sequence alignment software version 7: improvements in performance and usability</article-title>. <source>Mol. Biol. Evol.</source> <volume>30</volume>, <fpage>772</fpage>&#x2013;<lpage>780</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/mst010</pub-id>, PMID: <pub-id pub-id-type="pmid">23329690</pub-id>
</mixed-citation>
</ref>
<ref id="B28">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kim</surname> <given-names>J. S.</given-names></name>
<name><surname>Chung</surname> <given-names>H.</given-names></name>
<name><surname>Park</surname> <given-names>B.</given-names></name>
<name><surname>Veerappan</surname> <given-names>K.</given-names></name>
<name><surname>Kim</surname> <given-names>Y. K.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Chloroplast genome sequencing and divergence analysis of 18 <italic>Pyrus</italic> species: insights into intron length polymorphisms and evolutionary processes</article-title>. <source>Front. Genet.</source> <volume>15</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fgene.2024.1468596</pub-id>, PMID: <pub-id pub-id-type="pmid">39507619</pub-id>
</mixed-citation>
</ref>
<ref id="B29">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Kom&#xe1;rek</surname> <given-names>J.</given-names></name>
<name><surname>Fott</surname> <given-names>B.</given-names></name>
</person-group> (<year>1983</year>). 
<article-title>Das Phytoplankton des S&#xfc;&#xdf;wassers</article-title>. <source>Systematik und Biologie. Teil</source> <volume>7</volume>, <fpage>1</fpage>.
</mixed-citation>
</ref>
<ref id="B30">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lagesen</surname> <given-names>K.</given-names></name>
<name><surname>Hallin</surname> <given-names>P.</given-names></name>
<name><surname>R&#xf8;dland</surname> <given-names>E. A.</given-names></name>
<name><surname>Staerfeldt</surname> <given-names>H.-H.</given-names></name>
<name><surname>Rognes</surname> <given-names>T.</given-names></name>
<name><surname>Ussery</surname> <given-names>D. W.</given-names></name>
</person-group> (<year>2007</year>). 
<article-title>RNAmmer: consistent and rapid annotation of ribosomal RNA genes</article-title>. <source>Nucleic Acids Res.</source> <volume>35</volume>, <fpage>3100</fpage>&#x2013;<lpage>3108</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkm160</pub-id>, PMID: <pub-id pub-id-type="pmid">17452365</pub-id>
</mixed-citation>
</ref>
<ref id="B31">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Lang</surname> <given-names>B. F.</given-names></name>
<name><surname>Nedelcu</surname> <given-names>A. M.</given-names></name>
</person-group> (<year>2012</year>). &#x201c;<article-title>Plastid genomes of algae</article-title>,&#x201d; in <source>Genomics of Chloroplasts and Mitochondria</source>. Eds. 
<person-group person-group-type="editor">
<name><surname>Bock</surname> <given-names>R.</given-names></name>
<name><surname>Knoop</surname> <given-names>V.</given-names></name>
</person-group> (<publisher-loc>Dordrecht</publisher-loc>: 
<publisher-name>Springer Netherlands</publisher-name>), <fpage>59</fpage>&#x2013;<lpage>87</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-94-007-2920-9_3</pub-id>
</mixed-citation>
</ref>
<ref id="B32">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lee</surname> <given-names>C.</given-names></name>
<name><surname>Cooper</surname> <given-names>J. T.</given-names></name>
<name><surname>Moroni</surname> <given-names>F.</given-names></name>
<name><surname>Salim</surname> <given-names>A. M.</given-names></name>
<name><surname>Lee</surname> <given-names>C.</given-names></name>
<name><surname>Spanbauer</surname> <given-names>T.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>Complete plastome of <italic>Coelastrum microporum</italic> N&#xe4;geli (Scenedesmaceae, Sphaeropleales)</article-title>. <source>Mitochondrial DNA Part B Resour.</source> <volume>8</volume>, <fpage>948</fpage>&#x2013;<lpage>951</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/23802359.2023.2252941</pub-id>, PMID: <pub-id pub-id-type="pmid">37701527</pub-id>
</mixed-citation>
</ref>
<ref id="B33">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lee</surname> <given-names>C.</given-names></name>
<name><surname>Ruhlman</surname> <given-names>T. A.</given-names></name>
<name><surname>Jansen</surname> <given-names>R. K.</given-names></name>
</person-group> (<year>2020</year>). 
<article-title>Unprecedented intraindividual structural heteroplasmy in <italic>Eleocharis</italic> (Cyperaceae, Poales) plastomes</article-title>. <source>Genome Biol. Evol.</source> <volume>12</volume>, <fpage>641</fpage>&#x2013;<lpage>655</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gbe/evaa076</pub-id>, PMID: <pub-id pub-id-type="pmid">32282915</pub-id>
</mixed-citation>
</ref>
<ref id="B34">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lemieux</surname> <given-names>C.</given-names></name>
<name><surname>Otis</surname> <given-names>C.</given-names></name>
<name><surname>Turmel</surname> <given-names>M.</given-names></name>
</person-group> (<year>2014</year>). 
<article-title>Six newly sequenced chloroplast genomes from prasinophyte green algae provide insights into the relationships among prasinophyte lineages and the diversity of streamlined genome architecture in picoplanktonic species</article-title>. <source>BMC Genomics</source> <volume>15</volume>, <elocation-id>857</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2164-15-857</pub-id>, PMID: <pub-id pub-id-type="pmid">25281016</pub-id>
</mixed-citation>
</ref>
<ref id="B35">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Lowe</surname> <given-names>T. M.</given-names></name>
<name><surname>Chan</surname> <given-names>P. P.</given-names></name>
</person-group> (<year>2016</year>). 
<article-title>tRNAscan-SE On-line: integrating search and context for analysis of transfer RNA genes</article-title>. <source>Nucleic Acids Res.</source> <volume>44</volume>, <fpage>W54</fpage>&#x2013;<lpage>W57</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkw413</pub-id>, PMID: <pub-id pub-id-type="pmid">27174935</pub-id>
</mixed-citation>
</ref>
<ref id="B36">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>McManus</surname> <given-names>H. A.</given-names></name>
<name><surname>Fu&#x10d;&#xed;kov&#xe1;</surname> <given-names>K.</given-names></name>
<name><surname>Lewis</surname> <given-names>P. O.</given-names></name>
<name><surname>Lewis</surname> <given-names>L. A.</given-names></name>
<name><surname>Karol</surname> <given-names>K. G.</given-names></name>
</person-group> (<year>2018</year>). 
<article-title>Organellar phylogenomics inform systematics in the green algal family Hydrodictyaceae (Chlorophyceae) and provide clues to the complex evolutionary history of plastid genomes in the green algal tree of life</article-title>. <source>Am. J. Bot.</source> <volume>105</volume>, <fpage>315</fpage>&#x2013;<lpage>329</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/ajb2.1066</pub-id>, PMID: <pub-id pub-id-type="pmid">29722901</pub-id>
</mixed-citation>
</ref>
<ref id="B37">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Minh</surname> <given-names>B. Q.</given-names></name>
<name><surname>Schmidt</surname> <given-names>H. A.</given-names></name>
<name><surname>Chernomor</surname> <given-names>O.</given-names></name>
<name><surname>Schrempf</surname> <given-names>D.</given-names></name>
<name><surname>Woodhams</surname> <given-names>M. D.</given-names></name>
<name><surname>von Haeseler</surname> <given-names>A.</given-names></name>
<etal/>
</person-group>. (<year>2020</year>). 
<article-title>IQ-TREE 2: new models and efficient methods for phylogenetic inference in the genomic era</article-title>. <source>Mol. Biol. Evol.</source> <volume>37</volume>, <fpage>1530</fpage>&#x2013;<lpage>1534</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msaa015</pub-id>, PMID: <pub-id pub-id-type="pmid">32011700</pub-id>
</mixed-citation>
</ref>
<ref id="B38">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Mishler</surname> <given-names>B. D.</given-names></name>
<name><surname>Theriot</surname> <given-names>E.</given-names></name>
</person-group> (<year>2000</year>). &#x201c;
<article-title>The phylogenetic species concept (sensu Mishler and Theriot): Monophyly, apomorphy, and phylogenetic species concepts</article-title>,&#x201d; in <source>Species Concepts and Phylogenetic Theory: A Debate</source> (
<publisher-name>Columbia University Press</publisher-name>, <publisher-loc>New York</publisher-loc>), <fpage>44</fpage>&#x2013;<lpage>54</lpage>.
</mixed-citation>
</ref>
<ref id="B39">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Mower</surname> <given-names>J. P.</given-names></name>
<name><surname>Vickrey</surname> <given-names>T. L.</given-names></name>
</person-group> (<year>2018</year>). &#x201c;
<article-title>Chapter nine - Structural diversity among plastid genomes of land plants</article-title>,&#x201d; in <source>Advances in Botanical Research</source>. Eds. 
<person-group person-group-type="editor">
<name><surname>Chaw</surname> <given-names>S.-M.</given-names></name>
<name><surname>Jansen</surname> <given-names>R. K.</given-names></name>
</person-group> (<publisher-loc>Cambridge, MA</publisher-loc>: 
<publisher-name>Academic Press</publisher-name>), <fpage>263</fpage>&#x2013;<lpage>292</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/bs.abr.2017.11.013</pub-id>
</mixed-citation>
</ref>
<ref id="B40">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Mu&#xf1;oz-G&#xf3;mez</surname> <given-names>S. A.</given-names></name>
<name><surname>Mej&#xed;a-Franco</surname> <given-names>F. G.</given-names></name>
<name><surname>Durnin</surname> <given-names>K.</given-names></name>
<name><surname>Colp</surname> <given-names>M.</given-names></name>
<name><surname>Grisdale</surname> <given-names>C. J.</given-names></name>
<name><surname>Archibald</surname> <given-names>J. M.</given-names></name>
<etal/>
</person-group>. (<year>2017</year>). 
<article-title>The new red algal subphylum Proteorhodophytina comprises the largest and most divergent plastid genomes known</article-title>. <source>Curr. Biol.</source> <volume>27</volume>, <fpage>1677</fpage>&#x2013;<lpage>1684.e4</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cub.2017.04.054</pub-id>, PMID: <pub-id pub-id-type="pmid">28528908</pub-id>
</mixed-citation>
</ref>
<ref id="B41">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Palenik</surname> <given-names>B.</given-names></name>
<name><surname>Grimwood</surname> <given-names>J.</given-names></name>
<name><surname>Aerts</surname> <given-names>A.</given-names></name>
<name><surname>Rouz&#xe9;</surname> <given-names>P.</given-names></name>
<name><surname>Salamov</surname> <given-names>A.</given-names></name>
<name><surname>Putnam</surname> <given-names>N.</given-names></name>
<etal/>
</person-group>. (<year>2007</year>). 
<article-title>The tiny eukaryote <italic>Ostreococcus</italic> provides genomic insights into the paradox of plankton speciation</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>104</volume>, <fpage>7705</fpage>&#x2013;<lpage>7710</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.0611046104</pub-id>, PMID: <pub-id pub-id-type="pmid">17460045</pub-id>
</mixed-citation>
</ref>
<ref id="B42">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Pollock</surname> <given-names>D. D.</given-names></name>
<name><surname>Zwickl</surname> <given-names>D. J.</given-names></name>
<name><surname>McGuire</surname> <given-names>J. A.</given-names></name>
<name><surname>Hillis</surname> <given-names>D. M.</given-names></name>
</person-group> (<year>2002</year>). 
<article-title>Increased taxon sampling is advantageous for phylogenetic inference</article-title>. <source>Syst. Biol.</source> <volume>51</volume>, <fpage>664</fpage>&#x2013;<lpage>671</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/10635150290102357</pub-id>, PMID: <pub-id pub-id-type="pmid">12228008</pub-id>
</mixed-citation>
</ref>
<ref id="B43">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Ren</surname> <given-names>Q.</given-names></name>
<name><surname>Wang</surname> <given-names>Y.</given-names></name>
<name><surname>Lin</surname> <given-names>Y.</given-names></name>
<name><surname>Zhen</surname> <given-names>Z.</given-names></name>
<name><surname>Cui</surname> <given-names>Y.</given-names></name>
<name><surname>Qin</surname> <given-names>S.</given-names></name>
</person-group> (<year>2021</year>). 
<article-title>The extremely large chloroplast genome of the green alga <italic>Haematococcus pluvialis</italic>: Genome structure, and comparative analysis</article-title>. <source>Algal Res.</source> <volume>56</volume>, <elocation-id>102308</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.algal.2021.102308</pub-id>
</mixed-citation>
</ref>
<ref id="B44">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Robbens</surname> <given-names>S.</given-names></name>
<name><surname>Derelle</surname> <given-names>E.</given-names></name>
<name><surname>Ferraz</surname> <given-names>C.</given-names></name>
<name><surname>Wuyts</surname> <given-names>J.</given-names></name>
<name><surname>Moreau</surname> <given-names>H.</given-names></name>
<name><surname>Van de Peer</surname> <given-names>Y.</given-names></name>
</person-group> (<year>2007</year>). 
<article-title>The complete chloroplast and mitochondrial DNA sequence of <italic>Ostreococcus tauri</italic>: organelle genomes of the smallest eukaryote are examples of compaction</article-title>. <source>Mol. Biol. Evol.</source> <volume>24</volume>, <fpage>956</fpage>&#x2013;<lpage>968</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msm012</pub-id>, PMID: <pub-id pub-id-type="pmid">17251180</pub-id>
</mixed-citation>
</ref>
<ref id="B45">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Sciuto</surname> <given-names>K.</given-names></name>
<name><surname>Lewis</surname> <given-names>L. A.</given-names></name>
<name><surname>Verleyen</surname> <given-names>E.</given-names></name>
<name><surname>Moro</surname> <given-names>I.</given-names></name>
<name><surname>La Rocca</surname> <given-names>N.</given-names></name>
</person-group> (<year>2015</year>). 
<article-title><italic>Chodatodesmus australis</italic> sp. nov. (Scenedesmaceae, Chlorophyta) from Antarctica, with the emended description of the genus <italic>Chodatodesmus</italic>, and circumscription of <italic>Flechtneria rotunda</italic> gen. et sp. nov</article-title>. <source>J. Phycol.</source> <volume>51</volume>, <fpage>1172</fpage>&#x2013;<lpage>1188</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/jpy.12355</pub-id>, PMID: <pub-id pub-id-type="pmid">26987011</pub-id>
</mixed-citation>
</ref>
<ref id="B46">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Smith</surname> <given-names>D. R.</given-names></name>
</person-group> (<year>2018</year>). 
<article-title><italic>Haematococcus lacustris</italic>: the makings of a giant-sized chloroplast genome</article-title>. <source>AoB Plants</source> <volume>10</volume>, <elocation-id>ply058</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/aobpla/ply058</pub-id>, PMID: <pub-id pub-id-type="pmid">30393516</pub-id>
</mixed-citation>
</ref>
<ref id="B47">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Smith</surname> <given-names>D. R.</given-names></name>
</person-group> (<year>2020</year>). 
<article-title>Can green algal plastid genome size be explained by DNA repair mechanisms</article-title>? <source>Genome Biol. Evol.</source> <volume>12</volume>, <fpage>3797</fpage>&#x2013;<lpage>3802</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gbe/evaa012</pub-id>, PMID: <pub-id pub-id-type="pmid">31971558</pub-id>
</mixed-citation>
</ref>
<ref id="B48">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Smith</surname> <given-names>D. R.</given-names></name>
<name><surname>Lee</surname> <given-names>R. W.</given-names></name>
</person-group> (<year>2009</year>). 
<article-title>The mitochondrial and plastid genomes of <italic>Volvox carteri</italic>: bloated molecules rich in repetitive DNA</article-title>. <source>BMC Genomics</source> <volume>10</volume>, <elocation-id>132</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/1471-2164-10-132</pub-id>, PMID: <pub-id pub-id-type="pmid">19323823</pub-id>
</mixed-citation>
</ref>
<ref id="B49">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Smith</surname> <given-names>D. R.</given-names></name>
<name><surname>Lee</surname> <given-names>R. W.</given-names></name>
</person-group> (<year>2010</year>). 
<article-title>Low nucleotide diversity for the expanded organelle and nuclear genomes of <italic>Volvox carteri</italic> supports the mutational-hazard hypothesis</article-title>. <source>Mol. Biol. Evol.</source> <volume>27</volume>, <fpage>2244</fpage>&#x2013;<lpage>2256</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msq110</pub-id>, PMID: <pub-id pub-id-type="pmid">20430860</pub-id>
</mixed-citation>
</ref>
<ref id="B50">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Stegemann</surname> <given-names>S.</given-names></name>
<name><surname>Hartmann</surname> <given-names>S.</given-names></name>
<name><surname>Ruf</surname> <given-names>S.</given-names></name>
<name><surname>Bock</surname> <given-names>R.</given-names></name>
</person-group> (<year>2003</year>). 
<article-title>High-frequency gene transfer from the chloroplast genome to the nucleus</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>100</volume>, <fpage>8828</fpage>&#x2013;<lpage>8833</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1430924100</pub-id>, PMID: <pub-id pub-id-type="pmid">12817081</pub-id>
</mixed-citation>
</ref>
<ref id="B51">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Turmel</surname> <given-names>M.</given-names></name>
<name><surname>de Cambiaire</surname> <given-names>J.-C.</given-names></name>
<name><surname>Otis</surname> <given-names>C.</given-names></name>
<name><surname>Lemieux</surname> <given-names>C.</given-names></name>
</person-group> (<year>2016</year>). 
<article-title>Distinctive architecture of the chloroplast genome in the chlorodendrophycean green algae <italic>Scherffelia dubia</italic> and <italic>Tetraselmis</italic> sp. CCMP 881</article-title>. <source>PLoS One</source> <volume>11</volume>, <elocation-id>e0148934</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0148934</pub-id>, PMID: <pub-id pub-id-type="pmid">26849226</pub-id>
</mixed-citation>
</ref>
<ref id="B52">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Turmel</surname> <given-names>M.</given-names></name>
<name><surname>Gagnon</surname> <given-names>M.-C.</given-names></name>
<name><surname>O&#x2019;Kelly</surname> <given-names>C. J.</given-names></name>
<name><surname>Otis</surname> <given-names>C.</given-names></name>
<name><surname>Lemieux</surname> <given-names>C.</given-names></name>
</person-group> (<year>2009</year>). 
<article-title>The chloroplast genomes of the green algae <italic>Pyramimonas</italic>, <italic>Monomastix</italic>, and <italic>Pycnococcus</italic> shed new light on the evolutionary history of prasinophytes and the origin of the secondary chloroplasts of euglenids</article-title>. <source>Mol. Biol. Evol.</source> <volume>26</volume>, <fpage>631</fpage>&#x2013;<lpage>648</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/msn285</pub-id>, PMID: <pub-id pub-id-type="pmid">19074760</pub-id>
</mixed-citation>
</ref>
<ref id="B53">
<mixed-citation publication-type="book">
<person-group person-group-type="author">
<name><surname>Turmel</surname> <given-names>M.</given-names></name>
<name><surname>Lemieux</surname> <given-names>C.</given-names></name>
</person-group> (<year>2018</year>). &#x201c;
<article-title>Chapter six - Evolution of the plastid genome in green algae</article-title>,&#x201d; in <source>Advances in Botanical Research</source>. Eds. 
<person-group person-group-type="editor">
<name><surname>Chaw</surname> <given-names>S.-M.</given-names></name>
<name><surname>Jansen</surname> <given-names>R. K.</given-names></name>
</person-group> (<publisher-loc>Cambridge, MA</publisher-loc>: 
<publisher-name>Academic Press</publisher-name>), <fpage>157</fpage>&#x2013;<lpage>193</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/bs.abr.2017.11.010</pub-id>
</mixed-citation>
</ref>
<ref id="B54">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Turmel</surname> <given-names>M.</given-names></name>
<name><surname>Otis</surname> <given-names>C.</given-names></name>
<name><surname>Lemieux</surname> <given-names>C.</given-names></name>
</person-group> (<year>2015</year>). 
<article-title>Dynamic evolution of the chloroplast genome in the green algal classes Pedinophyceae and Trebouxiophyceae</article-title>. <source>Genome Biol. Evol.</source> <volume>7</volume>, <fpage>2062</fpage>&#x2013;<lpage>2082</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/gbe/evv130</pub-id>, PMID: <pub-id pub-id-type="pmid">26139832</pub-id>
</mixed-citation>
</ref>
<ref id="B55">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Turmel</surname> <given-names>M.</given-names></name>
<name><surname>Otis</surname> <given-names>C.</given-names></name>
<name><surname>Lemieux</surname> <given-names>C.</given-names></name>
</person-group> (<year>2017</year>). 
<article-title>Divergent copies of the large inverted repeat in the chloroplast genomes of ulvophycean green algae</article-title>. <source>Sci. Rep.</source> <volume>7</volume>, <fpage>994</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41598-017-01144-1</pub-id>, PMID: <pub-id pub-id-type="pmid">28428552</pub-id>
</mixed-citation>
</ref>
<ref id="B56">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>T.</given-names></name>
<name><surname>Feng</surname> <given-names>H.</given-names></name>
<name><surname>Zhu</surname> <given-names>H.</given-names></name>
<name><surname>Zhong</surname> <given-names>B.</given-names></name>
</person-group> (<year>2025</year>). 
<article-title>Molecular phylogeny and comparative chloroplast genome analysis of the type species <italic>Crucigenia quadrata</italic></article-title>. <source>BMC Plant Biol.</source> <volume>25</volume>, <fpage>64</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s12870-025-06070-3</pub-id>, PMID: <pub-id pub-id-type="pmid">39815182</pub-id>
</mixed-citation>
</ref>
<ref id="B57">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>Q.</given-names></name>
<name><surname>Hou</surname> <given-names>Y.</given-names></name>
<name><surname>Li</surname> <given-names>Y.</given-names></name>
<name><surname>Shi</surname> <given-names>Y.</given-names></name>
<name><surname>Liu</surname> <given-names>G.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Phylogenetic study on Scenedesmacae with the description of a new genus <italic>Coccoidesmus</italic> gen. nov. (Chlorophyceae, Chlorophyta) and chloroplast genome analyses</article-title>. <source>J. Oceanol. Limnol.</source> <volume>42</volume>, <fpage>1272</fpage>&#x2013;<lpage>1285</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00343-023-3139-9</pub-id>
</mixed-citation>
</ref>
<ref id="B58">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wang</surname> <given-names>Q.</given-names></name>
<name><surname>Song</surname> <given-names>H.</given-names></name>
<name><surname>Liu</surname> <given-names>X.</given-names></name>
<name><surname>Zhu</surname> <given-names>H.</given-names></name>
<name><surname>Hu</surname> <given-names>Z.</given-names></name>
<name><surname>Liu</surname> <given-names>G.</given-names></name>
</person-group> (<year>2019</year>). 
<article-title>Deep genomic analysis of <italic>Coelastrella saipanensis</italic> (Scenedesmaceae, Chlorophyta): comparative chloroplast genomics of Scenedesmaceae</article-title>. <source>Eur. J. Phycol.</source> <volume>54</volume>, <fpage>52</fpage>&#x2013;<lpage>65</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/09670262.2018.1503334</pub-id>
</mixed-citation>
</ref>
<ref id="B59">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Wicke</surname> <given-names>S.</given-names></name>
<name><surname>Schneeweiss</surname> <given-names>G. M.</given-names></name>
<name><surname>dePamphilis</surname> <given-names>C. W.</given-names></name>
<name><surname>M&#xfc;ller</surname> <given-names>K. F.</given-names></name>
<name><surname>Quandt</surname> <given-names>D.</given-names></name>
</person-group> (<year>2011</year>). 
<article-title>The evolution of the plastid chromosome in land plants: gene content, gene order, gene function</article-title>. <source>Plant Mol. Biol.</source> <volume>76</volume>, <fpage>273</fpage>&#x2013;<lpage>297</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11103-011-9762-4</pub-id>, PMID: <pub-id pub-id-type="pmid">21424877</pub-id>
</mixed-citation>
</ref>
<ref id="B60">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Xu</surname> <given-names>Y.</given-names></name>
<name><surname>Chen</surname> <given-names>X.</given-names></name>
<name><surname>Melkonian</surname> <given-names>M.</given-names></name>
<name><surname>Wang</surname> <given-names>S.</given-names></name>
<name><surname>Sahu</surname> <given-names>S. K.</given-names></name>
</person-group> (<year>2024</year>). 
<article-title>Comparative chloroplast genome analysis of two <italic>Desmodesmus</italic> species reveals genome diversity within Scenedesmaceae (Sphaeropleales, Chlorophyceae)</article-title>. <source>Protist</source> <volume>175</volume>, <elocation-id>126073</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.protis.2024.126073</pub-id>, PMID: <pub-id pub-id-type="pmid">39612570</pub-id>
</mixed-citation>
</ref>
<ref id="B61">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhao</surname> <given-names>X.</given-names></name>
<name><surname>Liu</surname> <given-names>C.</given-names></name>
<name><surname>He</surname> <given-names>L.</given-names></name>
<name><surname>Zeng</surname> <given-names>Z.</given-names></name>
<name><surname>Zhang</surname> <given-names>A.</given-names></name>
<name><surname>Li</surname> <given-names>H.</given-names></name>
<etal/>
</person-group>. (<year>2022</year>). 
<article-title>Structure and phylogeny of chloroplast and mitochondrial genomes of a chlorophycean algae <italic>Pectinodesmus pectinatus</italic> (Scenedesmaceae, Sphaeropleales)</article-title>. <source>Life Basel Switz.</source> <volume>12</volume>, <elocation-id>1912</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/life12111912</pub-id>, PMID: <pub-id pub-id-type="pmid">36431047</pub-id>
</mixed-citation>
</ref>
<ref id="B62">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zhou</surname> <given-names>W.</given-names></name>
<name><surname>Armijos</surname> <given-names>C. E.</given-names></name>
<name><surname>Lee</surname> <given-names>C.</given-names></name>
<name><surname>Lu</surname> <given-names>R.</given-names></name>
<name><surname>Wang</surname> <given-names>J.</given-names></name>
<name><surname>Ruhlman</surname> <given-names>T. A.</given-names></name>
<etal/>
</person-group>. (<year>2023</year>). 
<article-title>Plastid genome assembly using long-read data</article-title>. <source>Mol. Ecol. Resour.</source> <volume>23</volume>, <fpage>1442</fpage>&#x2013;<lpage>1457</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/1755-0998.13787</pub-id>, PMID: <pub-id pub-id-type="pmid">36939021</pub-id>
</mixed-citation>
</ref>
<ref id="B63">
<mixed-citation publication-type="journal">
<person-group person-group-type="author">
<name><surname>Zwickl</surname> <given-names>D. J.</given-names></name>
<name><surname>Hillis</surname> <given-names>D. M.</given-names></name>
</person-group> (<year>2002</year>). 
<article-title>Increased taxon sampling greatly reduces phylogenetic error</article-title>. <source>Syst. Biol.</source> <volume>51</volume>, <fpage>588</fpage>&#x2013;<lpage>598</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/10635150290102339</pub-id>, PMID: <pub-id pub-id-type="pmid">12228001</pub-id>
</mixed-citation>
</ref>
</ref-list>
<fn-group>
<fn id="n1" fn-type="custom" custom-type="edited-by">
<p>Edited by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/128276">Rafael R. Robaina</ext-link>, University of Las Palmas de Gran Canaria, Spain</p></fn>
<fn id="n2" fn-type="custom" custom-type="reviewed-by">
<p>Reviewed by: <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/387326">Zixi Chen</ext-link>, Shenzhen University, China</p>
<p><ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1019292">Jadran F. Garcia</ext-link>, University of California, Davis, United States</p></fn>
</fn-group>
</back>
</article>