<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2021.774617</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Chloroplast Genomes for Five <italic>Skeletonema</italic> Species: Comparative and Phylogenetic Analysis</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Liu</surname> <given-names>Shuya</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Xu</surname> <given-names>Qing</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1523765/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Liu</surname> <given-names>Kuiyan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhao</surname> <given-names>Yongfang</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Chen</surname> <given-names>Nansheng</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1058005/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>CAS Key Laboratory of Marine Ecology and Environmental Sciences, Institute of Oceanology, Chinese Academy of Sciences</institution>, <addr-line>Qingdao</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Functional Laboratory of Marine Ecology and Environmental Science, Qingdao National Laboratory for Marine Science and Technology</institution>, <addr-line>Qingdao</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>Center for Ocean Mega-Science, Chinese Academy of Sciences</institution>, <addr-line>Qingdao</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>College of Life Science and Technology, Huazhong Agricultural University</institution>, <addr-line>Wuhan</addr-line>, <country>China</country></aff>
<aff id="aff5"><sup>5</sup><institution>College of Marine Science, University of Chinese Academy of Sciences</institution>, <addr-line>Beijing</addr-line>, <country>China</country></aff>
<aff id="aff6"><sup>6</sup><institution>Jiaozhou Bay National Marine Ecosystem Research Station, Institute of Oceanology, Chinese Academy of Sciences</institution>, <addr-line>Qingdao</addr-line>, <country>China</country></aff>
<aff id="aff7"><sup>7</sup><institution>Department of Molecular Biology and Biochemistry, Simon Fraser University</institution>, <addr-line>Burnaby, BC</addr-line>, <country>Canada</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Koichiro Awai, Shizuoka University, Japan</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Yoshihisa Hirakawa, University of Tsukuba, Japan; Denis Baurain, University of Li&#x00E8;ge, Belgium</p></fn>
<corresp id="c001">&#x002A;Correspondence: Nansheng Chen, <email>chenn@qdio.ac.cn</email></corresp>
<fn fn-type="other" id="fn004"><p>This article was submitted to Marine and Freshwater Plants, a section of the journal Frontiers in Plant Science</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>13</day>
<month>12</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>12</volume>
<elocation-id>774617</elocation-id>
<history>
<date date-type="received">
<day>12</day>
<month>09</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>22</day>
<month>11</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2021 Liu, Xu, Liu, Zhao and Chen.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Liu, Xu, Liu, Zhao and Chen</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p><italic>Skeletonema</italic> species are cosmopolitan coastal diatoms that exhibit important roles in ecological system. The chloroplast genomes (cpDNAs) have been proven to be important in the study of molecular evolution and genetic diversity. However, cpDNA of only a single <italic>Skeletonema</italic> species (<italic>S. pseudocostatum</italic>) has been constructed, hindering in-depth investigation on <italic>Skeletonema</italic> species. In this study, complete cpDNAs of five <italic>Skeletonema</italic> species were constructed with cpDNAs of four species <italic>S. marinoi</italic>, <italic>S. tropicum</italic>, <italic>S. costatum</italic>, and <italic>S. grevillea</italic> constructed for the first time. These cpDNAs had similar sizes and same numbers of genes. These cpDNAs were highly syntenic with no substantial expansions, contractions, or inversions. Interestingly, two copies of <italic>petF</italic>, which encodes ferredoxin with critical role in iron dependency, were found in all five <italic>Skeletonema</italic> species, with one copy in the cpDNA and another copy in the nuclear genome of each species. Selection analysis revealed that all PCGs of cpDNAs were undergoing purifying selection. Despite the high conservation of these cpDNAs, nine genomic regions with high sequence divergence were identified, which illustrated substantial variations that could be used as markers for phylogenetic inference and for tracking <italic>Skeletonema</italic> species in the field. Additionally, the numbers of simple sequence repeats varied among different cpDNAs, which were useful for detecting genetic polymorphisms. The divergence times estimated using PCGs of cpDNAs revealed that most of these species were established within &#x223C;33 Mya, consistent with that estimated using mtDNAs. Overall, the current study deepened our understanding about the molecular evolution of <italic>Skeletonema</italic> cpDNAs.</p>
</abstract>
<kwd-group>
<kwd><italic>Skeletonema</italic> species</kwd>
<kwd>chloroplast genomes</kwd>
<kwd>comparative genomics</kwd>
<kwd>divergence time</kwd>
<kwd>phylogenetic analysis</kwd>
<kwd>PETF</kwd>
</kwd-group>
<counts>
<fig-count count="7"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="66"/>
<page-count count="14"/>
<word-count count="9346"/>
</counts>
</article-meta>
</front>
<body>
<sec id="S1" sec-type="intro">
<title>Introduction</title>
<p>The chloroplasts are organelles for photosynthesis and other biochemical pathways in plants and algae (<xref ref-type="bibr" rid="B20">Halliwell, 1984</xref>). Chloroplast genomes (cpDNAs) represent maternal inheritance. A typical cpDNA has a highly conserved circular DNA arrangement with a quadripartite structure with a pair of inverted repeats (IRs: IRA and IRB), which are separated from the large-single copy (LSC) region and the small-single copy (SSC) region (<xref ref-type="bibr" rid="B48">Sabir et al., 2014</xref>; <xref ref-type="bibr" rid="B38">Liu and Pang, 2016</xref>; <xref ref-type="bibr" rid="B65">Yu et al., 2018</xref>; <xref ref-type="bibr" rid="B1">Abdullah et al., 2021</xref>; <xref ref-type="bibr" rid="B33">Kim et al., 2021</xref>). Research on cpDNAs complements researches on mitochondrial genomes (mtDNAs), which also present uniparental inheritance, and the nuclear genomes (<xref ref-type="bibr" rid="B15">Gould et al., 2008</xref>; <xref ref-type="bibr" rid="B12">Garg and Gould, 2016</xref>; <xref ref-type="bibr" rid="B62">Xu et al., 2017</xref>). Complete cpDNA sequences have been widely accepted as an informative and valuable source for understanding evolutionary biology and ecological applications (<xref ref-type="bibr" rid="B22">Hamsher et al., 2019</xref>; <xref ref-type="bibr" rid="B54">Song et al., 2020</xref>).</p>
<p>As one of the most diverse and ecologically important groups in phytoplankton, diatoms (Bacillariophyta) contribute about one-fifth of the total photosynthesis on earth (<xref ref-type="bibr" rid="B3">Armbrust, 2009</xref>; <xref ref-type="bibr" rid="B42">Malviya et al., 2016</xref>). The plastids of Bacillariophyta were derived by a second endosymbiosis in which red algae were taken up by a eukaryotic heterotroph (<xref ref-type="bibr" rid="B4">Armbrust et al., 2004</xref>; <xref ref-type="bibr" rid="B3">Armbrust, 2009</xref>). With time, genes from the red algae were transferred to the host nuclear genomes and many photosynthetic proteins were now encoded in the nuclear genomes, synthesized in the cytoplasm and imported into the chloroplast (<xref ref-type="bibr" rid="B15">Gould et al., 2008</xref>; <xref ref-type="bibr" rid="B12">Garg and Gould, 2016</xref>). Such endosymbiotic gene transfers (EGTs) may be critical in evolution. For example, the transfer of the <italic>petF</italic> gene, which encodes for ferredoxin with critical role in iron dependency was found to be transferred from the cpDNA to the nuclear genome in the diatom <italic>Thalassiosira oceanica</italic> (<xref ref-type="bibr" rid="B41">Lommer et al., 2010</xref>; <xref ref-type="bibr" rid="B45">Roy et al., 2020</xref>). This transfer may be critical for this diatom species to adapt to the low-iron ocean regions (<xref ref-type="bibr" rid="B56">Strzepek and Harrison, 2004</xref>).</p>
<p>The phylum Bacillariophyta is estimated to have 12,000 - 30,000 species (<xref ref-type="bibr" rid="B42">Malviya et al., 2016</xref>). In contrast, cpDNAs of only 55 Bacillariophyta species have been constructed, hindering further research on the evolution of Bacillariophyta species. Thus, construction and analysis of more Bacillariophyta cpDNAs are urgently needed for understanding their evolutionary history.</p>
<p>The genus <italic>Skeletonema</italic>, which belongs to Skeletonemataceae family, Thalassiosirales order, Mediophyceae class in Bacillariophyta, consisted of 21 taxonomically accepted species (<xref ref-type="bibr" rid="B49">Sarno et al., 2005</xref>, <xref ref-type="bibr" rid="B50">2007</xref>; <xref ref-type="bibr" rid="B18">Guiry and Guiry, 2021</xref>). <italic>Skeletonema</italic> species have a cosmopolitan distribution and are usually dominant phytoplankton in the coastal seawaters and estuaries (<xref ref-type="bibr" rid="B34">Kooistra et al., 2008</xref>; <xref ref-type="bibr" rid="B39">Liu et al., 2020</xref>; <xref ref-type="bibr" rid="B8">Cui et al., 2021</xref>). As an important primary producer, <italic>Skeletonema</italic> species provide food source for the higher trophic levels (<xref ref-type="bibr" rid="B34">Kooistra et al., 2008</xref>). Many <italic>Skeletonema</italic> species, including <italic>S. marinoi</italic>, <italic>S. costatum</italic>, and <italic>S. pseudocostatum</italic>, can form harmful algae blooms (HABs) with negative impact on environments (<xref ref-type="bibr" rid="B14">Godhe et al., 2006</xref>; <xref ref-type="bibr" rid="B51">Shuya and Nansheng, 2021</xref>). For example, high concentrations of <italic>Skeletonema</italic> species utilize nutrients necessary for other species, and also could cause hypoxia or anoxia (<xref ref-type="bibr" rid="B43">Mohamed, 2018</xref>). For their easy survival, fast growth, and absence of toxins, <italic>Skeletonema</italic> species are often used as food source for aquaculture (<xref ref-type="bibr" rid="B23">Hemaiswarya et al., 2011</xref>). Because of high ecological relevance, <italic>Skeletonema</italic> species are also used as the model phytoplankton species for genetic diversity and physiological adaptation studies (<xref ref-type="bibr" rid="B27">Johansson et al., 2019</xref>). For example, <xref ref-type="bibr" rid="B19">Haernstroem et al. (2011)</xref> used <italic>S. marinoi</italic> as a model organism, and studied the genetic structure and diversity of <italic>S. marinoi</italic> in sediment core accumulated over a 100 years. However, genomic resources of <italic>Skeletonema</italic> species are limited. For example, cpDNA of only a single <italic>Skeletonema</italic> species, <italic>S. pseudocostatum</italic>, has been constructed (<xref ref-type="bibr" rid="B21">Hamedi et al., 2019</xref>).</p>
<p>The aims of our study are: (1) to provide complete cpDNA sequences in <italic>Skeletonema</italic> genus for further comparative analysis; (2) to find suitable molecular markers to distinguish <italic>Skeletonema</italic> species in species level for ecological application; (3) to understand the genetic and evolutionary characteristics in cpDNAs of <italic>Skeletonema</italic> species. In this study, we successfully constructed complete cpDNAs of five <italic>Skeletonema</italic> species (total six <italic>Skeletonema</italic> strains) and analyzed their genomic structures, phylogenetic relationships, nucleotide substitutions, simple sequence repeats (SSRs), and divergence times, as well as the duplicative transfer of <italic>petF</italic> gene to the nucleus.</p>
</sec>
<sec id="S2" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec id="S2.SS1">
<title>Strain Isolation, DNA Sequencing, cpDNA Construction and Annotation</title>
<p>In this study six <italic>Skeletonema</italic> strains were analyzed, and they were isolated from the coastal waters of China including the Bohai Sea (CNS00100), the Jiaozhou Bay (CNS00166), the Yellow Sea (CNS00243), the Changjiang Estuary (CNS00303), the Beibu Gulf (CNS00342), and the South China Sea (CNS00438), respectively, using single-cell capillary method. They were cultured in the L1 medium (<xref ref-type="bibr" rid="B17">Guillard and Hargraves, 1993</xref>). The DNA extraction and sequencing were same as described previously (<xref ref-type="bibr" rid="B61">Wang et al., 2021</xref>).</p>
<p>The complete cpDNAs were assembled using GetOrganelle (<xref ref-type="bibr" rid="B26">Jin et al., 2020</xref>) using MK372941 (<italic>S. pseudocostatum</italic>) as a reference. The cpDNAs were then validated by aligning sequencing reads against the cpDNAs using BWA (<xref ref-type="bibr" rid="B36">Li and Durbin, 2009</xref>) and SAMtools (<xref ref-type="bibr" rid="B37">Li et al., 2009</xref>), and the alignments were inspected using IGV (<xref ref-type="bibr" rid="B57">Thorvaldsdottir et al., 2013</xref>). After validation, the cpDNAs were annotated using MFannot<sup><xref ref-type="fn" rid="footnote1">1</xref></sup> with genetic code of 11 Bacterial, Archaeal and Plant Plastid, and were then validated using ORF Finder<sup><xref ref-type="fn" rid="footnote2">2</xref></sup>. To compare with published cpDNAs accurately, we have also inspected and re-annotated the 55 cpDNAs in Bacillariophyta from NCBI. The physical maps of the circular cpDNAs of six <italic>Skeletonema</italic> species were generated with Organellar Genome DRAW (OGDRAW) (<xref ref-type="bibr" rid="B16">Greiner et al., 2019</xref>). The quadripartite structures of <italic>Skeletonema</italic> cpDNAs were analyzed using Annotation of Organellar Genomes (GeSeq) (<xref ref-type="bibr" rid="B58">Tillich et al., 2017</xref>). The AT-skew and GC-skew were calculated according to the formulae: AT-skew = (A &#x2212; T)/(A + T) and GC-skew = (G &#x2212; C)/(G + C).</p>
</sec>
<sec id="S2.SS2">
<title>Synteny Analysis and Sequence Divergence Analysis</title>
<p>Synteny analysis of six cpDNAs was carried out using Mauve (<xref ref-type="bibr" rid="B9">Darling et al., 2010</xref>). Gene arrangements of IR regions were plotted using the R package gggenes (<xref ref-type="bibr" rid="B10">David, 2020</xref>). Alignments of six <italic>Skeletonema</italic> cpDNA sequences were visualized using mVISTA in the Shuffle-LAGAN mode (<xref ref-type="bibr" rid="B11">Frazer et al., 2004</xref>) with the <italic>S. marinoi</italic> cpDNA (MW679506) as a reference sequence. Nucleotide diversity analysis of cpDNAs was conducted using the DnaSP (<xref ref-type="bibr" rid="B46">Rozas et al., 2017</xref>) by sliding window (step size = 200 bp, window length = 600 bp).</p>
<p>Based on the results of nucleotide diversity, nine regions with high sequence divergence were identified. The primers of these regions were designed using the Primer Premier 5.0 (<xref ref-type="supplementary-material" rid="DS1">Supplementary Table 1</xref>) (<xref ref-type="bibr" rid="B52">Singh et al., 1998</xref>). PCRs were performed in volumes of 50 &#x03BC;L containing 2 &#x03BC;L diluted template DNA (about 50 ng), 1 &#x03BC;L forward primer (10 &#x03BC;mol/L), 1 &#x03BC;L reverse primer (10 &#x03BC;mol/L), 25 &#x03BC;L mix (Tiangen, China) and 21 &#x03BC;L ddH<sub>2</sub>O. The reactions were denatured at 94&#x00B0;C for 4 min. Then, the reactions were run for 32 cycles at 94&#x00B0;C for 1 min, 52&#x00B0;C for 1 min 50 s, and 72&#x00B0;C for 2 min and a final extension at 72&#x00B0;C for 10 min. These PCR products were run on 1% agarose gels for checking amplicon lengths.</p>
</sec>
<sec id="S2.SS3">
<title>Phylogenetic Analysis</title>
<p>The phylogenetic trees of the nine regions were generated using the Maximum Likelihood (ML) method with 1000 bootstrap replicates in megaX (<xref ref-type="bibr" rid="B35">Kumar et al., 2018</xref>). The best-fit models were Tamura 3-parameter (T92 + G) for all regions except for CpVIII with General Time Reversible (GTR + G) model, which were obtained by Models.</p>
<p>Phylogenetic relationships within the 61 Bacillariophyta cpDNAs (six cpDNAs were constructed in this study and 55 cpDNAs were downloaded from NCBI) and one outgroup (<italic>Triparma laevis</italic>) were analyzed based on the 86 shared protein-coding genes (PCGs) among them. Amino acid sequence of 86 genes, including <italic>atpA, atpB, atpD, atpE, atpF, atpG, atpI, ccs1, ccsA, chlI, clpC, dnaB, ftsH, groEL, petA, petB, petD, petG, petL, petM, petN, psaA, psaB, psaD, psaF, psaJ, psbB, psbC, psbD, psbE, psbF, psbH, psbI, psbJ, psbK, psbL, psbN, psbT, psbV, psbX, psbY, rbcL, rbcS, rpl11, rpl12, rpl13, rpl14, rpl16, rpl18, rpl19, rpl1, rpl20, rpl23, rpl24, rpl29, rpl2, rpl31, rpl34, rpl35, rpl3, rpl4, rpl5, rpl6, rpoA, rpoB, rpoC1, rpoC2, rps10, rps11, rps12, rps13, rps14, rps16, rps17, rps18, rps20, rps2, rps3, rps4, rps5, rps7, rps9, secA, secY, tatC, and ycf3</italic>, were individually aligned by MAFFT (<xref ref-type="bibr" rid="B31">Katoh and Standley, 2013</xref>), trimmed by trimAl (<xref ref-type="bibr" rid="B7">Capella-Gutierrez et al., 2009</xref>), and concatenated by Phyutility (<xref ref-type="bibr" rid="B53">Smith and Dunn, 2008</xref>). The model for the phylogenetic tree was LG + F + R10, which was obtained by ModelFinder (<xref ref-type="bibr" rid="B29">Kalyaanamoorthy et al., 2017</xref>). Phylogenetic tree was constructed by IQ-TREE (<xref ref-type="bibr" rid="B59">Trifinopoulos et al., 2016</xref>) with SH-aLRT support (%)/aBayes support/ultrafast bootstrap support (%) and displayed by FigTree<sup><xref ref-type="fn" rid="footnote3">3</xref></sup>.</p>
</sec>
<sec id="S2.SS4">
<title>Simple Sequence Repeat Analysis and Selection Analysis</title>
<p>MISA (<xref ref-type="bibr" rid="B6">Beier et al., 2017</xref>) was used to search for SSRs in the cpDNA of <italic>Skeletonema</italic> species. The minimum number repeats were 10, 5, 4, 3, 3, and 3 for mono-, di-, tri-, tetra-, penta-, and hexa-nucleotides, respectively.</p>
<p>To estimate selection pressure, the rates of non-synonymous (Ka) and synonymous (Ks) substitutions were analyzed by KaKs_calculator2 (<xref ref-type="bibr" rid="B60">Wang et al., 2010</xref>). Ka/Ks values &#x003E; 1 indicated positive selection; and Ka/Ks &#x003C; 1 indicated purifying selection. Each PCG was calculated pairwise between two <italic>Skeletonema</italic> species, respectively. The results divided into different functional groups (same to <xref ref-type="fig" rid="F1">Figure 1</xref> generated by OGDRAW) were visualized by the box charts using the R package ggpubr (<xref ref-type="bibr" rid="B30">Kassambara, 2020</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Chloroplast genomes of six <italic>Skeletonema</italic> strains <bold>(A&#x2013;F)</bold> constructed in this study. Genes inside and outside of the circle are transcribed clockwise and counterclockwise, respectively. Genes belonging to different functional groups are shown in different colors. The LSC and SSC regions are separated by the inverted repeats (IRA and IRB). Dark and light gray colors in the inner circle correspond to the GC and AT content, respectively.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-774617-g001.tif"/>
</fig>
</sec>
<sec id="S2.SS5">
<title>Divergence Time Estimations</title>
<p>Molecular dating analysis was conducted by 96 cpDNA PCGs with DNA sequences in the Class Mediophyceae. The 96 PCGs were <italic>atpA, atpB, atpD, atpE, atpF, atpG, atpH, atpI, ccs1, ccsA, chlI, clpC, dnaB, dnaK, ftsH, groEL, petA, petB, petD, petG, petL, petM, petN, psaA, psaB, psaC, psaD, psaF, psaJ, psaL, psbB, psbC, psbD, psbE, psbF, psbH, psbI, psbJ, psbK, psbL, psbN, psbT, psbV, psbW, psbX, psbY, rbcL, rbcS, rpl1,rpl2,rpl3,rpl4,rpl5,rpl6,rpl11, rpl12, rpl13, rpl14, rpl16, rpl18, rpl19, rpl20, rpl23, rpl24,rpl29,rpl31,rpl34,rpl35, rpoA, rpoB, rpoC1, rpoC2, rps2, rps3, rps4, rps5, rps7, rps8, rps9, rps10, rps11, rps12, rps13, rps14, rps16, rps17, rps18, rps19, rps20, secA, secY, tatC, ycf3, ycf4, ycf39</italic>, and <italic>ycf41</italic>. These genes were analyzed in the PhyloSuite (<xref ref-type="bibr" rid="B66">Zhang et al., 2020</xref>), including alignment by Mafft, concatenation by Concatenate Sequence, finding the best-fit evolutionary model by PartitionFinder2 and phylogenetic trees construction using MrBayes methods. Molecular dating was performed using the PAML package (<xref ref-type="bibr" rid="B64">Yang, 2007</xref>). Two calibration points were used in the analysis (<xref ref-type="supplementary-material" rid="DS1">Supplementary Table 2</xref>), including <italic>Synedra</italic> and <italic>Fragilaria</italic> (<xref ref-type="bibr" rid="B44">Nakov et al., 2018</xref>), <italic>Ectocarpus siliculosus</italic> and Bacillariophyta (<xref ref-type="bibr" rid="B3">Armbrust, 2009</xref>). The phylogenetic tree was visualized in the FigTree with 95% highest posterior density interval (HPD).</p>
</sec>
<sec id="S2.SS6">
<title>Gene Structure and Phylogenetic Analysis of <italic>petF</italic> Gene Among <italic>Skeletonema</italic> Species</title>
<p>To obtain scaffolds, clean data were assembled independently using Platanus (<xref ref-type="bibr" rid="B28">Kajitani et al., 2019</xref>), SPAdes (<xref ref-type="bibr" rid="B5">Bankevich et al., 2012</xref>), and ABySS (<xref ref-type="bibr" rid="B25">Jackman et al., 2017</xref>). To find <italic>petF</italic> genes encoded in the nuclear genome, sequences of <italic>petF</italic> of published <italic>Skeletonema</italic> species (<xref ref-type="bibr" rid="B45">Roy et al., 2020</xref>) were used as references to find the target scaffolds using BLAST (tblastn). Because some software failed to assemble the target scaffolds or the assembly was too fragmented, we combined and compared results of tree assembly software. The target scaffolds were further annotated using genewise<sup><xref ref-type="fn" rid="footnote4">4</xref></sup> (<xref ref-type="bibr" rid="B13">GeneWise, 2008</xref>). Phylogenetic analysis of <italic>petF</italic> genes from cpDNAs and nuclear genomes of <italic>Skeletonema</italic> species were analyzed based on peptide sequences using the Maximum Likelihood (ML) method with 1000 bootstrap replicates in megaX (<xref ref-type="bibr" rid="B35">Kumar et al., 2018</xref>). The best-fit model was WAG + G selected by Models. <italic>petF</italic> gene structures were visualized using Gene Structure Display Server (<xref ref-type="bibr" rid="B24">Hu et al., 2015</xref>). Four <italic>Thalassiosira</italic> species were added for comparison: The <italic>petF</italic> genes of <italic>T. pseudonana</italic> (EF067921) and <italic>T. weissflogii</italic> (KJ958485) were encoded in cpDNA, and the <italic>petF</italic> genes of <italic>T. oceanica</italic> (EJK54785) and <italic>T. rotula</italic> (MMETSP0913) were encoded by the nuclear genomes (<xref ref-type="bibr" rid="B45">Roy et al., 2020</xref>).</p>
</sec>
</sec>
<sec id="S3" sec-type="results">
<title>Results</title>
<sec id="S3.SS1">
<title>General Characteristics of Chloroplast Genomes</title>
<p>In this study, we constructed complete cpDNAs of six <italic>Skeletonema</italic> strains (CNS00100, CNS00166, CNS00243, CNS00303, CNS00342, and CNS00438) isolated from Chinese coastal seawaters. These six <italic>Skeletonema</italic> strains were annotated as <italic>S. marinoi</italic>, <italic>S. tropicum</italic>, <italic>S. costatum</italic>, <italic>S. costatum</italic>, <italic>S. pseudocostatum</italic>, and <italic>S. grevillei</italic>, respectively, based on their morphological features and similarity to corresponding reference molecular markers (<xref ref-type="bibr" rid="B40">Liu et al., 2021</xref>). Although CNS00243 and CNS00303 were identified as different <italic>Skeletonema</italic> species originally, both the strains were proved to be <italic>S. costatum</italic> by our recent study (<xref ref-type="bibr" rid="B40">Liu et al., 2021</xref>). By now, the cpDNA of only a single <italic>Skeletonema</italic> species, which is <italic>S. pseudocostatum</italic>, has been constructed (<xref ref-type="bibr" rid="B21">Hamedi et al., 2019</xref>). The cpDNAs of all <italic>Skeletonema</italic> species analyzed in this study showed the typical quadripartite structure in which LSC and SSC regions were separated by a pair of inverted repeats (IRA and IRB) (<xref ref-type="fig" rid="F1">Figure 1</xref>). The sizes of these cpDNAs were very similar, ranging from 126,883 bp (<italic>S. grevillei</italic>) to 127,353 bp (<italic>S. costatum</italic> of CNS303 strain) (<xref ref-type="table" rid="T1">Table 1</xref>). The sizes of LSCs varied from 63,849 bp (<italic>S. grevillei</italic>) to 64,143 bp (<italic>S. costatum</italic> of both CNS00243 and CNS00303 strains), the sizes of SSCs varied from 26,508 bp (<italic>S</italic>. <italic>pseudocostatum</italic>) to 26,707 bp (<italic>S. costatum</italic> of CNS303 strain), and the sizes of IRs varied from 18,210 bp (<italic>S. grevillei</italic>) to 18,252 bp (<italic>S. costatum</italic> of both CNS00243 and CNS00303 strains). The AT contents of these cpDNAs were also very similar, ranging from 68.42 to 69.29% (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<table-wrap position="float" id="T1">
<label>TABLE 1</label>
<caption><p>The Summary of complete cpDNA feature of the <italic>Skeletonema</italic> species.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<tbody>
<tr>
<td><inline-graphic xlink:href="fpls-12-774617-t001.jpg"/></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn><p><italic>The strains in blue color were isolated in this study.</italic></p></fn>
</table-wrap-foot>
</table-wrap>
<p>Consistent with the high similarity of genome sizes and AT contents of these <italic>Skeletonema</italic> species, their gene contents were identical, including 141 PCGs, 31 tRNAs, six rRNAs, one non-coding RNA (ncRNA), and one transfer-messenger RNA (tmRNA) (<xref ref-type="table" rid="T1">Table 1</xref>). No introns were identified in these six cpDNAs. As expected, the combined lengths corresponding to PCGs were the largest, followed by that corresponding to rRNAs, intergenic spacer regions (ISRs), tRNAs, tmRNAs and ncRNAs (<xref ref-type="supplementary-material" rid="DS1">Supplementary Table 3</xref>). The sizes of 141 PCGs were rather different, ranging from 90 bp (<italic>petN</italic>) to 4338 bp (<italic>rpoC2</italic>) (<xref ref-type="fig" rid="F2">Figure 2A</xref>). The AT contents did not show much differences among these categories (<xref ref-type="fig" rid="F2">Figure 2B</xref>). The nucleotide skew analysis showed that all the <italic>Skeletonema</italic> cpDNAs exhibited a moderate positive GC-skew (0.0012&#x2013;0.0047) and a more prominent AT-skew (0.029&#x2013;0.032) (<xref ref-type="fig" rid="F2">Figures 2C,D</xref>).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>General features of the <italic>Skeletonema</italic> cpDNAs. <bold>(A)</bold> Sizes and <bold>(B)</bold> AT contents of PCG, rRNA, tRNA, ncRNA, tmRNA, and intergenic spacer region (ISR) for the six <italic>Skeletonema</italic> cpDNAs. <bold>(C)</bold> Relationships between G + C contents and GC skews, <bold>(D)</bold> Relationships between A + T contents and AT skews of <italic>Skeletonema</italic> cpDNAs and other 55 published Bacillariophyta cpDNAs.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-774617-g002.tif"/>
</fig>
</sec>
<sec id="S3.SS2">
<title>Synteny Analysis and Nucleotide Diversity Analysis</title>
<p>Alignment of six <italic>Skeletonema</italic> cpDNAs using Mauve revealed highly similar gene arrangements (<xref ref-type="fig" rid="F3">Figure 3A</xref>). No expansion or contraction of IR was observed among these <italic>Skeletonema</italic> cpDNAs (<xref ref-type="fig" rid="F3">Figure 3B</xref>). Sequence identity analysis by mVISTA (<xref ref-type="fig" rid="F3">Figure 3C</xref>) also revealed high similarity across the cpDNAs, with higher conservation observed for PCGs than non-coding regions. The nucleotide diversity exhibited different patterns in the quadripartite structures (<xref ref-type="fig" rid="F3">Figure 3D</xref>), with higher conservation of the IR regions than the LSC and SSC regions.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>Gene order comparison and the sequence divergence analysis of six <italic>Skeletonema</italic> chloroplast genomes. <bold>(A)</bold> Synteny comparison of the six <italic>Skeletonema</italic> cpDNAs using Mauve analysis. Rectangular blocks of the same color indicate collinear regions. <bold>(B)</bold> Gene arrangements in the inverted repeats (IR) regions of <italic>Skeletonema</italic> cpDNAs. The colors of genes are same with that in the <xref ref-type="fig" rid="F1">Figure 1</xref>, indicating the different functional groups. <bold>(C)</bold> Identity plot comparing the cpDNA of six <italic>Skeletonma</italic> strains using mVISTA. The <italic>S. marinoi</italic> cpDNA (MW679506) is selected as the reference sequence. The vertical scale on the left indicated the identity percentages (range shown: 50&#x2013;100%). The arrow with light gray named contig on the horizontal axis indicate the cpDNAs of <italic>Skeletonema</italic>. The dark gray arrows above the alignments indicate gene orientation. Genome regions are colored as exon, untranslated region (UTR) and conserved non-coding sequences (CNS). <bold>(D)</bold> Nucleotide diversity (Pi) of the <italic>Skeletonema</italic> cpDNA sequences based on sliding window analysis. The window length is 600 bp and the step size is 200 bp. The horizontal axis indicate the position of the midpoint of a window. The vertical axis indicate the nucleotide diversity of each window. The nine regions with great sequence divergence are also shown in the <bold>(C,D)</bold>, named CpI, CpII, to CpIX.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-774617-g003.tif"/>
</fig>
<p>Despite the well-conserved genomic structure, we identified nine regions with enhanced variations based on the sequence divergence analysis (<xref ref-type="fig" rid="F3">Figures 3C,D</xref>). These regions, which were named CpI, CpII, CpIII, CpIV, CpV, CpVI, CpVII, CpVIII and CpIX, located in <italic>rpl19 - petF- psaB</italic>, <italic>ycf89 - rns</italic> (IRA), <italic>dnaK - rpl3, clpC - thiG - trnN, rns - ycf89</italic> (IRB), <italic>ycf33 - trnT, chlI - petA, rpl33 - rps20 - rpoB, rpl12 - rpl1</italic>, respectively. The sequences of CpII and CpV regions are identical because they are symmetrically arranged in the IR. To evaluate the divergence of the nine regions, we carried out phylogenetic analysis of these DNA sequences, which showed that these nine regions could all successfully separate all five <italic>Skeletonema</italic> species (<xref ref-type="fig" rid="F4">Figure 4A</xref>). Thus, all of these divergent regions can be used as specific molecular markers for distinguishing different <italic>Skeletonema</italic> species (<xref ref-type="fig" rid="F4">Figures 4B,C</xref>). To test this idea, we have designed primers for amplifying the CpIII region and have successfully amplified this region in all strains (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 1</xref> and <xref ref-type="table" rid="T1">Table 1</xref>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>Nine suitable regions were suitable as barcodes or molecular markers. <bold>(A)</bold> Phylogenetic analysis of the nine regions among <italic>Skeletonema</italic> species. DNA alignment information <bold>(B)</bold> and agarose gels image of PCR products <bold>(C)</bold> for CpIII region among the <italic>Skeletonema</italic> species. The bands sequences are <italic>S. marinoi</italic>, <italic>S. tropicum</italic>, <italic>S. costatum</italic> (CNS00243 strain), <italic>S. costatum</italic> (CNS00303 strain), <italic>S. pseudocostatum</italic>, and <italic>S. grevillea</italic>, respectively. The bands of Marker M1 and M2 are shown on both sides. The sequence of CpII region is equal to the CpV region.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-774617-g004.tif"/>
</fig>
</sec>
<sec id="S3.SS3">
<title>Phylogenetic Analysis of <italic>Skeletonema</italic> Species</title>
<p>To explore the evolutionary relationships of <italic>Skeletonema</italic> among the Bacillariophyta species, the phylogenetic tree was constructed using a set of 86 chloroplast PCGs shared by 62 cpDNAs (<xref ref-type="fig" rid="F5">Figure 5</xref>). The phylogenetic tree showed the species in Bacillariophyta were divided into three distinct taxa, which generally corresponded to three classes Bacillariophyceae, Mediophyceae and Coscinodiscophyceae with one exception. <italic>Leptocylindrus danicus</italic> split from other species at the base of the phylogenetic tree and clustered with Coscinodiscophyceae species, suggesting that it was a member of the class Coscinodiscophyceae (<xref ref-type="fig" rid="F5">Figure 5</xref>). This annotation of <italic>L. danicus</italic> was consistent with the previous study (<xref ref-type="bibr" rid="B65">Yu et al., 2018</xref>), but was inconsistent with Algaebase (<xref ref-type="bibr" rid="B18">Guiry and Guiry, 2021</xref>), which indicated that this species belonged to the class Mediophyceae. <italic>Astrosyne radiata</italic> (MG755807) belonging to Bacillariophyceae was found to have the longest branch, which was consistent with the previous study (<xref ref-type="bibr" rid="B65">Yu et al., 2018</xref>) and also reported <italic>A. radiata</italic> exhibited a high level of gene order rearrangement.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>Phylogenetic tree based on concatenated amino acid sequences of 86 chloroplast PCGs. The six <italic>Skeletonema</italic> strains (in blue color) and other 55 Bacillariophyta species, which have been reported the cpDNAs, are included. <italic>Triparma laevis</italic> is used as outgroup taxa.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-774617-g005.tif"/>
</fig>
<p>As expected, <italic>Skeletonema</italic> species clustered together and formed a monophyletic group close to <italic>Thalassiosira</italic> species. Within <italic>Skeletonema</italic>, the two <italic>S. costatum</italic> strains (MW679508 and MW679509) formed an independent clade, which was sister to the rest of the <italic>Skeletonema</italic> species with 100% bootstrap support. The two <italic>S. pseudocostatum</italic> strains (MW679510 and MK372942), which were isolated from China and Algeria, respectively, clustered together as expected. The clade of <italic>S. pseudocostatum</italic> and <italic>S. tropicum</italic> clustered with the <italic>S. marinoi</italic> (MW679506). The clade including <italic>S. pseudocostatum</italic>, <italic>S. tropicum</italic> and <italic>S. marinoi</italic> was a sister to the clade with a single species: <italic>S. grevillei</italic> (MW679511).</p>
</sec>
<sec id="S3.SS4">
<title>Selection Analysis and SSR Analysis of the <italic>Skeletonema</italic> cpDNAs</title>
<p>The pairwise substitution rates (Ka/Ks) between the <italic>Skeletonema</italic> species were calculated using PCGs of cpDNA. In this study, the Ka/Ks ratio for all PCGs of all pairwise species comparison was below 1 (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 2</xref>), suggesting purifying selection. Interestingly, the <italic>rbcL</italic> and <italic>rbcS</italic> genes encoding to RubisCO subunit showed higher Ka/Ks ratio than genes belonging to other functional groups.</p>
<p>The distributions of SSRs among <italic>Skeletonema</italic> cpDNAs were analyzed using MISA (<xref ref-type="supplementary-material" rid="DS1">Supplementary Table 4</xref>). The lengths of SSRs ranged from 10 bp to 22 bp. Most SSRs are A/T type rather than the G/C type. Among the six detected categories, the most abundant were tetra-nucleotide repeats for all <italic>Skeletonema</italic> cpDNAs, accounting for 33.33% (<italic>S. marinoi</italic>)&#x2013;41.38% (<italic>S. costatum</italic>). The penta-nucleotide repeat was only found in the cpDNAs of <italic>S. costatum</italic>. The number of SSRs located in the ISRs (52.17&#x2013;63.89%) was slightly higher than that located within the genes (36.11&#x2013;47.83%). Among the quadripartite structure of <italic>Skeletonema</italic> cpDNAs, SSRs were mainly located in the LSC regions (47.83&#x2013;53.33%). We found that there was one more SSR (i.e., tetra-nucleotide repeat) in the <italic>S. pseudocostatum</italic> cpDNA (MW679510) of the Chinese strain than that in <italic>S. pseudocostatum</italic> cpDNA (MK372941) of the Algerian strain.</p>
</sec>
<sec id="S3.SS5">
<title>Divergence Time Estimation Based on the cpDNAs</title>
<p>The divergence times of <italic>Skeletonema</italic> species was estimated based on 96 PCGs shared by cpDNAs of 33 species (<xref ref-type="fig" rid="F6">Figure 6</xref>). The divergence time of the <italic>Skeletonema</italic> genus, which formed an independent clade apart from the <italic>Thalassiosira</italic> genus, was estimated to be 46 Million years ago (Mya; 95% HPD: 32.50&#x2013;59.23 Mya). Within the <italic>Skeletonema</italic> genus, <italic>S. grevillei</italic> diverged from other <italic>Skeletonema</italic> species around 33 Mya (95% HPD: 18.54&#x2013;47.83 Mya). The two HAB species <italic>S. marinoi</italic> and <italic>S. pseudocostatum</italic> diverged approximately 16 Mya (95% HPD 5.66&#x2013;29.85 Mya).</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption><p>Time-calibrated phylogeny of 33 diatom taxa based on 96 chloroplast genes with PAML. The red dots represented calibration point and translucent blue bars represented the 95% highest posterior density interval of each node ages.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-774617-g006.tif"/>
</fig>
</sec>
<sec id="S3.SS6">
<title>Co-existence of Two Copies of <italic>petF</italic> in <italic>Skeletonema</italic> Species</title>
<p>The cpDNA gene <italic>petF</italic> has been frequently found to be transferred from cpDNA to nuclear genomes in diatom species (<xref ref-type="bibr" rid="B41">Lommer et al., 2010</xref>; <xref ref-type="bibr" rid="B45">Roy et al., 2020</xref>). The transfer of <italic>petF</italic> has been proposed as a molecular mechanism underlying iron intake efficacy (<xref ref-type="bibr" rid="B56">Strzepek and Harrison, 2004</xref>). A copy of the <italic>petF</italic> gene was found in each of the <italic>Skeletonema</italic> cpDNA (<xref ref-type="fig" rid="F7">Figure 7A</xref>). However, gene annotation of assembled nuclear genomes of all five <italic>Skeletonema</italic> species revealed that the <italic>petF</italic> genes were also found in all of these <italic>Skeletonema</italic> nuclear genomes (<xref ref-type="fig" rid="F7">Figure 7A</xref>), suggesting that <italic>petF</italic> gene transfer did occur in evolution. A typical signal peptide was found at the N-terminal of each nuclear <italic>petF</italic>-encoded peptide, suggesting their role in chloroplast (<xref ref-type="fig" rid="F7">Figure 7B</xref>). Phylogenetic analysis of <italic>petF</italic> genes found in the cpDNAs and nuclear genomes uncovered that all cpDNA-encoded <italic>petF</italic> genes clustered together in one clade (including <italic>T. pseudonana</italic> and <italic>T. weissflogii</italic>), while nuclear <italic>petF</italic> gene clustered together in another clade (including <italic>T. oceanica</italic> and <italic>T. rotula</italic>) (<xref ref-type="fig" rid="F7">Figure 7B</xref>), suggesting that the transfer of <italic>petF</italic> gene occurred before the speciation of these <italic>Skeletonema</italic> species.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption><p>The characteristics of <italic>petF</italic> gene among <italic>Skeletonema</italic> species. <bold>(A)</bold> The phylogenetic analysis and genetic structure and <bold>(B)</bold> the alignment of amino acid sequences. Four <italic>Thalassiosira</italic> species are added for comparison. The <italic>petF</italic> genes of <italic>Skeletonema</italic> strains in red are identified from nuclear genome and these in black are identified from cpDNAs.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-774617-g007.tif"/>
</fig>
</sec>
</sec>
<sec id="S4" sec-type="discussion">
<title>Discussion</title>
<p><italic>Skeletonema</italic> species have been attracting extensive attention because they frequently dominate the phytoplankton composition along the coastal regions and play important role in primary production. Members of <italic>Skeletonema</italic> species, such as <italic>S. marinoi</italic>, <italic>S. costatum</italic> and <italic>S. pseudocostatum</italic>, can cause blooms with negative impact on environment. While the cpDNA sequences have been proven to be informative for genetic diversity evaluation, cpDNA of only a single species <italic>S</italic>. <italic>pseudocostatum</italic> has been constructed.</p>
<sec id="S4.SS1">
<title>Conserved cpDNAs and Sequence Divergence Analysis Among <italic>Skeletonema</italic> Species</title>
<p>In this study, we reported cpDNAs of five <italic>Skeletonema</italic> species, <italic>S. marinoi, S. tropicum</italic>, <italic>S. costatum</italic> (with two strains), <italic>S</italic>. <italic>pseudocostatum</italic> and <italic>S. grevillei</italic>, increasing the number of cpDNAs of <italic>Skeletonema</italic> species from one to five. These cpDNAs showed remarkable similarities in sizes (<xref ref-type="table" rid="T1">Table 1</xref>), gene composition, and gene organization (<xref ref-type="fig" rid="F1">Figures 1</xref>, <xref ref-type="fig" rid="F3">3</xref>). In contrast, cpDNAs of other intra-genus species belonging to the Bacillariophyceae class showed great difference. For example, the cpDNAs of three <italic>Halamphora</italic> species were not conserved, i.e., cpDNAs size (difference up to 28,811 bp), gene order (inversion and translocation), and gene contents (presence/absence of <italic>serC</italic> and <italic>tryC</italic>) (<xref ref-type="bibr" rid="B22">Hamsher et al., 2019</xref>).</p>
<p>Among the previously reported cpDNAs of 55 Bacillariophyta species, the sizes varied greatly, ranging from 111,539 bp (KR709240, <italic>Pseudo-nitzschia multiseries</italic>) to 201,816 bp (MG755792, <italic>Plagiogramma staurophorum</italic>). Comparative analysis of these cpDNAs revealed that the main factors contributing to variation of cpDNAs sizes included expansion or contraction of IR regions, gene loss or gain, presence or absence of introns and the length of ISR (<xref ref-type="bibr" rid="B48">Sabir et al., 2014</xref>; <xref ref-type="bibr" rid="B65">Yu et al., 2018</xref>). The largest cpDNA size of <italic>P. staurophorum</italic> so far discovered was mainly due to the expansion of IR regions (34,888 bp) and a large intron (2971 bp) in <italic>petD</italic> gene (<xref ref-type="bibr" rid="B65">Yu et al., 2018</xref>). During evolution, the IR regions have expanded and contracted under various stress condition. It was found that the large sizes of cpDNAs in the order of Thalassiosirales species were mainly contributed by the large size of IR regions (<xref ref-type="bibr" rid="B48">Sabir et al., 2014</xref>). The sizes of <italic>Skeletonema</italic> cpDNAs were above average among the reported Bacillariophyta cpDNAs and the lengths of IR regions were above 18,000 bp, which were congruent with the previous study (<xref ref-type="bibr" rid="B48">Sabir et al., 2014</xref>).</p>
<p>Loss of genes in the Thalassiosirales order including <italic>petF, petJ, acpP1, ilvB, ilvH, tsf, syfB, serC, syfB</italic>, and <italic>tyrC</italic> from cpDNAs had been previously reported (<xref ref-type="bibr" rid="B47">Ruck et al., 2014</xref>; <xref ref-type="bibr" rid="B48">Sabir et al., 2014</xref>; <xref ref-type="bibr" rid="B65">Yu et al., 2018</xref>). Analysis of cpDNAs of the five <italic>Skeletonema</italic> species confirmed that all of these genes except <italic>petF</italic> were lost from the cpDNAs of these five <italic>Skeletonema</italic> species. The <italic>petF</italic> gene was identified in the cpDNA of all five <italic>Skeletonema</italic> species. The loss of <italic>petF</italic> was found to be caused by the transfer of this gene from chloroplast to nucleus in many species including <italic>T. oceanica</italic>, which may play a role in iron utilization (<xref ref-type="bibr" rid="B41">Lommer et al., 2010</xref>; <xref ref-type="bibr" rid="B45">Roy et al., 2020</xref>). Interestingly, copies of the <italic>petF</italic> genes were also identified in the nuclear genomes of these five <italic>Skeletonema</italic> species (<xref ref-type="fig" rid="F7">Figure 7</xref>), indicating that each of these five <italic>Skeletonema</italic> species harbor at least two copies of <italic>petF</italic>. The nuclear-encoded <italic>petF</italic> genes of five <italic>Skeletonema</italic> species clustered together in the phylogenetic tree and had one intron in each gene structure (<xref ref-type="fig" rid="F7">Figure 7</xref>), suggesting that <italic>petF</italic> gene transfer from cpDNA to nuclear genome took place before the diversification of these <italic>Skeletonema</italic> species, and intron in the nuclear-encoded <italic>petF</italic> gene had already formed in their common ancestor.</p>
<p>Despite of the high synteny and conserved structure among <italic>Skeletonema</italic> cpDNAs, nine regions with enhanced divergences were detected. These regions with enhanced divergences were proved to be suitable as molecular markers for distinguishing <italic>Skeletonema</italic> species.</p>
<p>Simple sequence repeats can be highly variable at the intra-specific level and were often used as genetic markers in the population genetics studies (<xref ref-type="bibr" rid="B32">Kaur et al., 2015</xref>). The SSRs in cpDNAs of the seven <italic>Skeletonema</italic> taxa (including <italic>S. pseudocostatum</italic> of Algerian strain) represented abundant variation, especially for the same species (<italic>S. pseudocostatum</italic>) isolated from different seawaters. Thus, they are useful for detecting genetic polymorphisms among <italic>Skeletonema</italic> species.</p>
</sec>
<sec id="S4.SS2">
<title>Phylogeny and Selection Patterns Within <italic>Skeletonema</italic> cpDNAs</title>
<p>Phylogenetic tree based on the concatenated amino acid sequences of 86 shared cpDNA PCGs of 62 species showed that <italic>Skeletonema</italic> species formed an independent clade (<xref ref-type="fig" rid="F5">Figure 5</xref>). The phylogenetic analysis supported that <italic>S. pseudocostatum</italic> and <italic>S. tropicum</italic> could clustered into sister clade in agreement with the topology in recent studies using 18S rDNA, 28S rDNA, and <italic>cox1</italic> gens (<xref ref-type="bibr" rid="B34">Kooistra et al., 2008</xref>; <xref ref-type="bibr" rid="B63">Yamada et al., 2017</xref>). However, the topologies of the phylogenetic trees were not identical, the tree using the cpDNA PCGs obtained in this study was very similar with the tree based on 28S rDNA (<xref ref-type="bibr" rid="B34">Kooistra et al., 2008</xref>; <xref ref-type="bibr" rid="B63">Yamada et al., 2017</xref>), and was almost identical with the <italic>cox1</italic> tree (except the positions of <italic>S. costatum</italic> and <italic>S. grevillei</italic>) (<xref ref-type="bibr" rid="B40">Liu et al., 2021</xref>), but was different from the tree based on 18S rDNA (<xref ref-type="bibr" rid="B63">Yamada et al., 2017</xref>), confirming that these different genes can have incongruent histories.</p>
<p>Pairwise substitution rate (Ka/Ks) between cpDNAs of <italic>Skeletonema</italic> species was below 1, indicating all the PCGs of cpDNAs were under purifying selection. The purifying selection was also found in similar analysis performed in other species, such as <italic>Dracunculus</italic> (<xref ref-type="bibr" rid="B1">Abdullah et al., 2021</xref>) and <italic>Lagerstroemia</italic> (<xref ref-type="bibr" rid="B62">Xu et al., 2017</xref>).</p>
</sec>
<sec id="S4.SS3">
<title><italic>Skeletonema</italic> Species Divergence Time Estimation Based on cpDNAs</title>
<p>The <italic>Skeletonema</italic> species were nested within the paraphyletic genus <italic>Thalassiosira</italic> as supported by previous studies (<xref ref-type="bibr" rid="B55">Sorhannus, 2007</xref>; <xref ref-type="bibr" rid="B2">Alverson, 2014</xref>; <xref ref-type="bibr" rid="B45">Roy et al., 2020</xref>). The <italic>Skeletonema</italic> species diverged from <italic>Thalassiosira oceanica</italic> (the nearest species in <xref ref-type="fig" rid="F6">Figure 6</xref>) approximately 46 Mya in the Eocene period, which was slightly later than that estimated using two nuclear genes and two plastid genes (about 55 Mya) (<xref ref-type="bibr" rid="B2">Alverson, 2014</xref>). The two HAB species <italic>S. marinoi</italic> and <italic>S. pseudocostatum</italic> diverged approximated 16 Mya (95% HPD 5.66&#x2013;29.85 Mya), which was consistent with results estimated previously using 18S rDNA (about 14 Mya) (<xref ref-type="bibr" rid="B55">Sorhannus, 2007</xref>). The divergence time estimated in this study among <italic>Skeletonema</italic> species was generally similar or slight large than that estimated based on the mtDNA PCGs, indicating the clock rate was similar across the two organelles (<xref ref-type="bibr" rid="B40">Liu et al., 2021</xref>). This study provided the divergence time among the <italic>Skeletonema</italic> species based on the cpDNAs for the first time.</p>
</sec>
</sec>
<sec id="S5" sec-type="conclusion">
<title>Conclusion</title>
<p>In this study, we constructed complete cpDNAs for five <italic>Skeletonema</italic> species (two strains for <italic>S. costatum</italic>), including cpDNAs of four <italic>Skeletonema</italic> species for the first time. Comparative analysis of the cpDNA sizes, structure, gene number and gene arrangement showed high similarity among <italic>Skeletonema</italic> species. Variations of the IR regions among <italic>Skeletonema</italic> cpDNAs was low, suggesting the IR regions were highly conserved for cpDNAs of <italic>Skeletonema</italic> species, compared with those of other genera, such as the genus <italic>Thalassiosira</italic>. Nine regions with enhanced sequence divergence were obtained, which could be used to distinguish <italic>Skeletonema</italic> species. The PCGs of cpDNAs exhibited depressed Ka/Ks ratios, suggesting that their genes had experienced strong purifying selection to eliminate deleterious mutations. Further information from the whole genome data of <italic>Skeletonema</italic> species is needed to explore their ecological adaptability of different seawaters.</p>
</sec>
<sec id="S6" sec-type="data-availability">
<title>Data Availability Statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: The sequencing results (raw data) have been submitted to NCBI and the BioProject number is <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA695365">PRJNA695365</ext-link>. The cpDNAs of six <italic>Skeletonema</italic> strains have been submitted to NCBI and the accession numbers were <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="MW679506">MW679506</ext-link>&#x2013;<ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="MW679511">MW679511</ext-link>.</p>
</sec>
<sec id="S7">
<title>Author Contributions</title>
<p>NC conceived of the study. YZ helped the sampling from the Jiaozhou Bay. SL, KL, and QX performed analysis. SL and NC interpreted the data and wrote the manuscript. All authors contributed to the editing and gave final approval for publication.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="pudiscl1" sec-type="disclaimer">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<sec id="S8" sec-type="funding-information">
<title>Funding</title>
<p>This work was supported by the Strategic Priority Research Program of Chinese Academy of Sciences (XDB42000000), the Natural Science Foundation of China (41906118), the Chinese Academy of Sciences Pioneer Hundred Talents Program (to NC), the Taishan Scholar Project Special Fund (to NC), the Qingdao Innovation and Creation Plan (Talent Development Program - 5th Annual Pioneer and Innovator Leadership Award to NC, 19-3-2-16-zhc), and the National Key Research and Development Program of China (2017YFC1404300).</p>
</sec>
<ack><p>We are grateful to colleagues from the Jiaozhou Bay Marine Ecosystem Research Station for the opportunity to participate in the investigation expeditions and for their help with field sampling. We are also thankful to the open research cruise (NORC2019-01, NORC2019-03-02, and NORC2019-07) supported by the NSFC shiptime sharing Project (41849901, U1606404, and 41849007).</p>
</ack>
<sec id="S10" sec-type="supplementary-material"><title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2021.774617/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2021.774617/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.docx" id="DS1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Abdullah</surname></name> <name><surname>Henriquez</surname> <given-names>C. L.</given-names></name> <name><surname>Mehmood</surname> <given-names>F.</given-names></name> <name><surname>Hayat</surname> <given-names>A.</given-names></name> <name><surname>Sammad</surname> <given-names>A.</given-names></name> <name><surname>Waseem</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2021</year>). <article-title>Chloroplast genome evolution in the Dracunculus clade (Aroideae, Araceae).</article-title> <source><italic>Genomics</italic></source> <volume>113</volume> <fpage>183</fpage>&#x2013;<lpage>192</lpage>. <pub-id pub-id-type="doi">10.1016/j.ygeno.2020.12.016</pub-id> <pub-id pub-id-type="pmid">33326831</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Alverson</surname> <given-names>A. J.</given-names></name></person-group> (<year>2014</year>). <article-title>Timing marine&#x2013;freshwater transitions in the diatom order Thalassiosirales.</article-title> <source><italic>Paleobiology</italic></source> <volume>40</volume> <fpage>91</fpage>&#x2013;<lpage>101</lpage>. <pub-id pub-id-type="doi">10.1666/12055</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Armbrust</surname> <given-names>E. V.</given-names></name></person-group> (<year>2009</year>). <article-title>The life of diatoms in the world&#x2019;s oceans.</article-title> <source><italic>Nature</italic></source> <volume>459</volume> <fpage>185</fpage>&#x2013;<lpage>192</lpage>. <pub-id pub-id-type="doi">10.1038/nature08057</pub-id> <pub-id pub-id-type="pmid">19444204</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Armbrust</surname> <given-names>E. V.</given-names></name> <name><surname>Berges</surname> <given-names>J. A.</given-names></name> <name><surname>Bowler</surname> <given-names>C.</given-names></name> <name><surname>Green</surname> <given-names>B. R.</given-names></name> <name><surname>Martinez</surname> <given-names>D.</given-names></name> <name><surname>Putnam</surname> <given-names>N. H.</given-names></name><etal/></person-group> (<year>2004</year>). <article-title>The genome of the diatom thalassiosira pseudonana: ecology, evolution, and metabolism.</article-title> <source><italic>Science</italic></source> <volume>306</volume> <fpage>79</fpage>&#x2013;<lpage>86</lpage>. <pub-id pub-id-type="doi">10.1126/science.1101156</pub-id> <pub-id pub-id-type="pmid">15459382</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bankevich</surname> <given-names>A.</given-names></name> <name><surname>Nurk</surname> <given-names>S.</given-names></name> <name><surname>Antipov</surname> <given-names>D.</given-names></name> <name><surname>Gurevich</surname> <given-names>A. A.</given-names></name> <name><surname>Dvorkin</surname> <given-names>M.</given-names></name> <name><surname>Kulikov</surname> <given-names>A. S.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>SPAdes: a new genome assembly algorithm and its applications to single-cell sequencing.</article-title> <source><italic>J. Comput. Biol.</italic></source> <volume>19</volume> <fpage>455</fpage>&#x2013;<lpage>477</lpage>. <pub-id pub-id-type="doi">10.1089/cmb.2012.0021</pub-id> <pub-id pub-id-type="pmid">22506599</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Beier</surname> <given-names>S.</given-names></name> <name><surname>Thiel</surname> <given-names>T.</given-names></name> <name><surname>M&#x00FC;nch</surname> <given-names>T.</given-names></name> <name><surname>Scholz</surname> <given-names>U.</given-names></name> <name><surname>Mascher</surname> <given-names>M.</given-names></name></person-group> (<year>2017</year>). <article-title>MISA-web: a web server for microsatellite prediction.</article-title> <source><italic>Bioinformatics</italic></source> <volume>33</volume> <fpage>2583</fpage>&#x2013;<lpage>2585</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btx198</pub-id> <pub-id pub-id-type="pmid">28398459</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Capella-Gutierrez</surname> <given-names>S.</given-names></name> <name><surname>Silla-Martinez</surname> <given-names>J.</given-names></name> <name><surname>Gabaldon</surname> <given-names>T.</given-names></name></person-group> (<year>2009</year>). <article-title>trimAl: a tool for automated alignment trimming in large-scale phylogenetic analyses.</article-title> <source><italic>Bioinformatics</italic></source> <volume>25</volume> <fpage>1972</fpage>&#x2013;<lpage>1973</lpage>.</citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cui</surname> <given-names>Z.</given-names></name> <name><surname>Xu</surname> <given-names>Q.</given-names></name> <name><surname>Gibson</surname> <given-names>K.</given-names></name> <name><surname>Liu</surname> <given-names>S.</given-names></name> <name><surname>Chen</surname> <given-names>N.</given-names></name></person-group> (<year>2021</year>). <article-title>Metabarcoding analysis of harmful algal bloom species in the Changjiang Estuary, China.</article-title> <source><italic>Sci. Total Environ.</italic></source> <volume>782</volume>:<issue>146823</issue>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2021.146823</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Darling</surname> <given-names>A.</given-names></name> <name><surname>Mau</surname> <given-names>B.</given-names></name> <name><surname>Perna</surname> <given-names>N.</given-names></name></person-group> (<year>2010</year>). <article-title>progressiveMauve: multiple genome alignment with gene gain, loss and rearrangement.</article-title> <source><italic>Plos One</italic></source> <volume>5</volume>:<issue>e11147</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0011147</pub-id> <pub-id pub-id-type="pmid">20593022</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>David</surname> <given-names>W.</given-names></name></person-group> (<year>2020</year>). <source><italic>gggenes: Draw Gene Arrow Maps in &#x2018;ggplot2&#x2019;. R package version 0.4.1.</italic></source></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Frazer</surname> <given-names>K.</given-names></name> <name><surname>Pachter</surname> <given-names>L.</given-names></name> <name><surname>Poliakov</surname> <given-names>A.</given-names></name> <name><surname>Rubin</surname> <given-names>E.</given-names></name> <name><surname>Dubchak</surname> <given-names>I.</given-names></name></person-group> (<year>2004</year>). <article-title>VISTA: computational tools for comparative genomics.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>32</volume> <fpage>W273</fpage>&#x2013;<lpage>W279</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkh458</pub-id> <pub-id pub-id-type="pmid">15215394</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Garg</surname> <given-names>S. G.</given-names></name> <name><surname>Gould</surname> <given-names>S. B.</given-names></name></person-group> (<year>2016</year>). <article-title>The role of charge in protein targeting evolution.</article-title> <source><italic>Trends Cell Biol.</italic></source> <volume>26</volume> <fpage>894</fpage>&#x2013;<lpage>905</lpage>. <pub-id pub-id-type="doi">10.1016/j.tcb.2016.07.001</pub-id> <pub-id pub-id-type="pmid">27524662</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><collab>GeneWise</collab> (<year>2008</year>). <source><italic>GeneWise in Encyclopedia of Genetics, Genomics, Proteomics and Informatics.</italic></source> <publisher-loc>Dordrecht</publisher-loc>: <publisher-name>Springer</publisher-name>, <fpage>783</fpage>&#x2013;<lpage>783</lpage>.</citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Godhe</surname> <given-names>A.</given-names></name> <name><surname>McQuoid</surname> <given-names>M. R.</given-names></name> <name><surname>Karunasagar</surname> <given-names>I.</given-names></name> <name><surname>Karunasagar</surname> <given-names>I.</given-names></name> <name><surname>Rehnstam-Holm</surname> <given-names>A. S.</given-names></name></person-group> (<year>2006</year>). <article-title>Comparison of three common molecular tools for distinguishing among geographically separated clones of the diatom Skeletonema marinoi Sarno et Zingone (bacillariophyceae).</article-title> <source><italic>J. Phycol.</italic></source> <volume>42</volume> <fpage>280</fpage>&#x2013;<lpage>291</lpage>. <pub-id pub-id-type="doi">10.1111/j.1529-8817.2006.00197.x</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gould</surname> <given-names>S. B.</given-names></name> <name><surname>Waller</surname> <given-names>R. F.</given-names></name> <name><surname>McFadden</surname> <given-names>G. I.</given-names></name></person-group> (<year>2008</year>). <article-title>Plastid evolution.</article-title> <source><italic>Annu. Rev. Plant Biol.</italic></source> <volume>59</volume> <fpage>491</fpage>&#x2013;<lpage>517</lpage>. <pub-id pub-id-type="doi">10.1146/annurev.arplant.59.032607.092915</pub-id> <pub-id pub-id-type="pmid">18315522</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Greiner</surname> <given-names>S.</given-names></name> <name><surname>Lehwark</surname> <given-names>P.</given-names></name> <name><surname>Bock</surname> <given-names>R.</given-names></name></person-group> (<year>2019</year>). <article-title>OrganellarGenomeDRAW (OGDRAW) version 1.3.1: expanded toolkit for the graphical visualization of organellar genomes.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>47</volume> <fpage>W59</fpage>&#x2013;<lpage>W64</lpage>.</citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guillard</surname> <given-names>R. R. L.</given-names></name> <name><surname>Hargraves</surname> <given-names>P. E.</given-names></name></person-group> (<year>1993</year>). <article-title>Stichochrysis immobilis is a diatom, not a chrysophyte.</article-title> <source><italic>Phycologia</italic></source> <volume>32</volume> <fpage>234</fpage>&#x2013;<lpage>236</lpage>. <pub-id pub-id-type="doi">10.2216/i0031-8884-32-3-234.1</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guiry</surname> <given-names>M. D.</given-names></name> <name><surname>Guiry</surname> <given-names>G. M.</given-names></name></person-group> (<year>2021</year>). <source><italic>AlgaeBase.</italic></source> <publisher-loc>Galway</publisher-loc>: <publisher-name>National University of Ireland</publisher-name>.</citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Haernstroem</surname> <given-names>K.</given-names></name> <name><surname>Ellegaard</surname> <given-names>M.</given-names></name> <name><surname>Andersen</surname> <given-names>T. J.</given-names></name> <name><surname>Godhe</surname> <given-names>A.</given-names></name></person-group> (<year>2011</year>). <article-title>Hundred years of genetic structure in a sediment revived diatom population.</article-title> <source><italic>Proc. Nat. Acad. Sci. USA</italic></source> <volume>108</volume> <fpage>4252</fpage>&#x2013;<lpage>4257</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1013528108</pub-id> <pub-id pub-id-type="pmid">21282612</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Halliwell</surname> <given-names>B.</given-names></name></person-group> (<year>1984</year>). <source><italic>Chloroplast metabolism: The structure and function of chloroplasts in green leaf cells.</italic></source> <publisher-loc>Oxford</publisher-loc>: <publisher-name>Oxford University Press</publisher-name>.</citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hamedi</surname> <given-names>C.</given-names></name> <name><surname>Gastineau</surname> <given-names>R.</given-names></name> <name><surname>Lemieux</surname> <given-names>C.</given-names></name> <name><surname>Turmel</surname> <given-names>M.</given-names></name> <name><surname>Witkowski</surname> <given-names>A.</given-names></name> <name><surname>Baba Hamed</surname> <given-names>M. B.</given-names></name></person-group> (<year>2019</year>). <article-title>Complete chloroplast genome of the diatom Skeletonema pseudocostatum from the western mediterranean coast of algeria.</article-title> <source><italic>Mitochondrial DNA Part B</italic></source> <volume>4</volume> <fpage>1091</fpage>&#x2013;<lpage>1092</lpage>. <pub-id pub-id-type="doi">10.1080/23802359.2019.1586481</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hamsher</surname> <given-names>S. E.</given-names></name> <name><surname>Keepers</surname> <given-names>K. G.</given-names></name> <name><surname>Pogoda</surname> <given-names>C. S.</given-names></name> <name><surname>Stepanek</surname> <given-names>J. G.</given-names></name> <name><surname>Kane</surname> <given-names>N. C.</given-names></name> <name><surname>Kociolek</surname> <given-names>J. P.</given-names></name></person-group> (<year>2019</year>). <article-title>Extensive chloroplast genome rearrangement amongst three closely related Halamphora spp. (Bacillariophyceae), and evidence for rapid evolution as compared to land plants.</article-title> <source><italic>PLoS One</italic></source> <volume>14</volume>:<issue>e0217824</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0217824</pub-id> <pub-id pub-id-type="pmid">31269054</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hemaiswarya</surname> <given-names>S.</given-names></name> <name><surname>Raja</surname> <given-names>R.</given-names></name> <name><surname>Kumar</surname> <given-names>R. R.</given-names></name> <name><surname>Ganesan</surname> <given-names>V.</given-names></name> <name><surname>Anbazhagan</surname> <given-names>C.</given-names></name></person-group> (<year>2011</year>). <article-title>Microalgae: a sustainable feed source for aquaculture.</article-title> <source><italic>World J. Microbiol. Biotechnol.</italic></source> <volume>27</volume> <fpage>1737</fpage>&#x2013;<lpage>1746</lpage>. <pub-id pub-id-type="doi">10.1007/s11274-010-0632-z</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname> <given-names>B.</given-names></name> <name><surname>Jin</surname> <given-names>J.</given-names></name> <name><surname>Guo</surname> <given-names>A.-Y.</given-names></name> <name><surname>Zhang</surname> <given-names>H.</given-names></name> <name><surname>Luo</surname> <given-names>J.</given-names></name> <name><surname>Gao</surname> <given-names>G.</given-names></name></person-group> (<year>2015</year>). <article-title>GSDS 2.0: an upgraded gene feature visualization server.</article-title> <source><italic>Bioinformatics</italic></source> <volume>31</volume> <fpage>1296</fpage>&#x2013;<lpage>1297</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu817</pub-id> <pub-id pub-id-type="pmid">25504850</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jackman</surname> <given-names>S. D.</given-names></name> <name><surname>Vandervalk</surname> <given-names>B. P.</given-names></name> <name><surname>Mohamadi</surname> <given-names>H.</given-names></name> <name><surname>Chu</surname> <given-names>J.</given-names></name> <name><surname>Yeo</surname> <given-names>S.</given-names></name> <name><surname>Hammond</surname> <given-names>S. A.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>ABySS 2.0: resource-efficient assembly of large genomes using a Bloom filter.</article-title> <source><italic>Genome Res.</italic></source> <volume>27</volume> <fpage>768</fpage>&#x2013;<lpage>777</lpage>. <pub-id pub-id-type="doi">10.1101/gr.214346.116</pub-id> <pub-id pub-id-type="pmid">28232478</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jin</surname> <given-names>J.-J.</given-names></name> <name><surname>Yu</surname> <given-names>W.-B.</given-names></name> <name><surname>Yang</surname> <given-names>J.-B.</given-names></name> <name><surname>Song</surname> <given-names>Y.</given-names></name> <name><surname>dePamphilis</surname> <given-names>C. W.</given-names></name> <name><surname>Yi</surname> <given-names>T.-S.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>GetOrganelle: a fast and versatile toolkit for accurate de novo assembly of organelle genomes.</article-title> <source><italic>Genome Biol.</italic></source> <volume>21</volume>:<issue>21545</issue>. <pub-id pub-id-type="doi">10.1186/s13059-020-02154-5</pub-id> <pub-id pub-id-type="pmid">32912315</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Johansson</surname> <given-names>O. N.</given-names></name> <name><surname>T&#x00F6;pel</surname> <given-names>M.</given-names></name> <name><surname>Pinder</surname> <given-names>M. I. M.</given-names></name> <name><surname>Kourtchenko</surname> <given-names>O.</given-names></name> <name><surname>Blomberg</surname> <given-names>A.</given-names></name> <name><surname>Godhe</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Skeletonema marinoi as a new genetic model for marine chain-forming diatoms.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>9</volume>:<issue>5391</issue>. <pub-id pub-id-type="doi">10.1038/s41598-019-41085-5</pub-id> <pub-id pub-id-type="pmid">30940823</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kajitani</surname> <given-names>R.</given-names></name> <name><surname>Yoshimura</surname> <given-names>D.</given-names></name> <name><surname>Okuno</surname> <given-names>M.</given-names></name> <name><surname>Minakuchi</surname> <given-names>Y.</given-names></name> <name><surname>Kagoshima</surname> <given-names>H.</given-names></name> <name><surname>Fujiyama</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Platanus-allee is a de novo haplotype assembler enabling a comprehensive access to divergent heterozygous regions.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>10</volume>:<issue>1702</issue>. <pub-id pub-id-type="doi">10.1038/s41467-019-09575-2</pub-id> <pub-id pub-id-type="pmid">30979905</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kalyaanamoorthy</surname> <given-names>S.</given-names></name> <name><surname>Minh</surname> <given-names>B. Q.</given-names></name> <name><surname>Wong</surname> <given-names>T. K. F.</given-names></name> <name><surname>von Haeseler</surname> <given-names>A.</given-names></name> <name><surname>Jermiin</surname> <given-names>L. S.</given-names></name></person-group> (<year>2017</year>). <article-title>ModelFinder: fast model selection for accurate phylogenetic estimates.</article-title> <source><italic>Nat. Methods</italic></source> <volume>14</volume> <fpage>587</fpage>&#x2013;<lpage>589</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.4285</pub-id> <pub-id pub-id-type="pmid">28481363</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kassambara</surname> <given-names>A.</given-names></name></person-group> (<year>2020</year>). <source><italic>ggpubr: &#x2018;ggplot2&#x2019; Based Publication Ready Plots. R package version 0.4.0.</italic></source></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Katoh</surname> <given-names>K.</given-names></name> <name><surname>Standley</surname> <given-names>D.</given-names></name></person-group> (<year>2013</year>). <article-title>MAFFT multiple sequence alignment software version 7: improvements in performance and usability.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>30</volume> <fpage>772</fpage>&#x2013;<lpage>780</lpage>.</citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kaur</surname> <given-names>S.</given-names></name> <name><surname>Panesar</surname> <given-names>P. S.</given-names></name> <name><surname>Bera</surname> <given-names>M. B.</given-names></name> <name><surname>Kaur</surname> <given-names>V.</given-names></name></person-group> (<year>2015</year>). <article-title>Simple sequence repeat markers in genetic divergence and marker-assisted selection of rice cultivars: a review.</article-title> <source><italic>Crit. Rev. Food Sci. Nutr.</italic></source> <volume>55</volume> <fpage>41</fpage>&#x2013;<lpage>49</lpage>. <pub-id pub-id-type="doi">10.1080/10408398.2011.646363</pub-id> <pub-id pub-id-type="pmid">24915404</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>S.-C.</given-names></name> <name><surname>Lee</surname> <given-names>J.-W.</given-names></name> <name><surname>Choi</surname> <given-names>B.-K.</given-names></name></person-group> (<year>2021</year>). <article-title>Seven complete chloroplast genomes from symplocos: genome organization and comparative analysis.</article-title> <source><italic>Forests</italic></source> <volume>12</volume>:<issue>608</issue>.</citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kooistra</surname> <given-names>W.</given-names></name> <name><surname>Sarno</surname> <given-names>D.</given-names></name> <name><surname>Balzano</surname> <given-names>S.</given-names></name> <name><surname>Gu</surname> <given-names>H. F.</given-names></name> <name><surname>Andersen</surname> <given-names>R. A.</given-names></name> <name><surname>Zingone</surname> <given-names>A.</given-names></name></person-group> (<year>2008</year>). <article-title>Global diversity and biogeography of Skeletonema species (Bacillariophyta).</article-title> <source><italic>Protist</italic></source> <volume>159</volume> <fpage>177</fpage>&#x2013;<lpage>193</lpage>. <pub-id pub-id-type="doi">10.1016/j.protis.2007.09.004</pub-id> <pub-id pub-id-type="pmid">18042429</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kumar</surname> <given-names>S.</given-names></name> <name><surname>Stecher</surname> <given-names>G.</given-names></name> <name><surname>Li</surname> <given-names>M.</given-names></name> <name><surname>Knyaz</surname> <given-names>C.</given-names></name> <name><surname>Tamura</surname> <given-names>K.</given-names></name></person-group> (<year>2018</year>). <article-title>MEGA X: molecular evolutionary genetics analysis across computing platforms.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>35</volume> <fpage>1547</fpage>&#x2013;<lpage>1549</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msy096</pub-id> <pub-id pub-id-type="pmid">29722887</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Durbin</surname> <given-names>R.</given-names></name></person-group> (<year>2009</year>). <article-title>Fast and accurate short read alignment with Burrows-Wheeler transform.</article-title> <source><italic>Bioinformatics</italic></source> <volume>25</volume> <fpage>1754</fpage>&#x2013;<lpage>1760</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp324</pub-id> <pub-id pub-id-type="pmid">19451168</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Handsaker</surname> <given-names>B.</given-names></name> <name><surname>Wysoker</surname> <given-names>A.</given-names></name> <name><surname>Fennell</surname> <given-names>T.</given-names></name> <name><surname>Ruan</surname> <given-names>J.</given-names></name> <name><surname>Homer</surname> <given-names>N.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>The Sequence Alignment/Map format and SAMtools.</article-title> <source><italic>Bioinformatics</italic></source> <volume>25</volume> <fpage>2078</fpage>&#x2013;<lpage>2079</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp352</pub-id> <pub-id pub-id-type="pmid">19505943</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>F.</given-names></name> <name><surname>Pang</surname> <given-names>S.</given-names></name></person-group> (<year>2016</year>). <article-title>Chloroplast genome of Sargassum horneri (Sargassaceae, Phaeophyceae): comparative chloroplast genomics of brown algae.</article-title> <source><italic>J. Appl. Phycol.</italic></source> <volume>28</volume> <fpage>1419</fpage>&#x2013;<lpage>1426</lpage>. <pub-id pub-id-type="doi">10.1007/s10811-015-0609-2</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>S.</given-names></name> <name><surname>Gibson</surname> <given-names>K.</given-names></name> <name><surname>Cui</surname> <given-names>Z.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name> <name><surname>Sun</surname> <given-names>X.</given-names></name> <name><surname>Chen</surname> <given-names>N.</given-names></name></person-group> (<year>2020</year>). <article-title>Metabarcoding analysis of harmful algal species in Jiaozhou Bay.</article-title> <source><italic>Harmful Algae</italic></source> <volume>92</volume>:<issue>101772</issue>. <pub-id pub-id-type="doi">10.1016/j.hal.2020.101772</pub-id> <pub-id pub-id-type="pmid">32113606</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>S.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Xu</surname> <given-names>Q.</given-names></name> <name><surname>Zhang</surname> <given-names>M.</given-names></name> <name><surname>Chen</surname> <given-names>N.</given-names></name></person-group> (<year>2021</year>). <article-title>Comparative analysis of full-length mitochondrial genomes of five Skeletonema species reveals conserved genome organization and recent speciation.</article-title> <source><italic>BMC Genomics</italic></source> <volume>22</volume>:<issue>7999</issue>. <pub-id pub-id-type="doi">10.1186/s12864-021-07999-z</pub-id> <pub-id pub-id-type="pmid">34654361</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lommer</surname> <given-names>M.</given-names></name> <name><surname>Roy</surname> <given-names>A.-S.</given-names></name> <name><surname>Schilhabel</surname> <given-names>M.</given-names></name> <name><surname>Schreiber</surname> <given-names>S.</given-names></name> <name><surname>Rosenstiel</surname> <given-names>P.</given-names></name> <name><surname>LaRoche</surname> <given-names>J.</given-names></name></person-group> (<year>2010</year>). <article-title>Recent transfer of an iron-regulated gene from the plastid to the nuclear genome in an oceanic diatom adapted to chronic iron limitation.</article-title> <source><italic>BMC Genomics</italic></source> <volume>11</volume>:<issue>718</issue>. <pub-id pub-id-type="doi">10.1186/1471-2164-11-718</pub-id> <pub-id pub-id-type="pmid">21171997</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Malviya</surname> <given-names>S.</given-names></name> <name><surname>Scalco</surname> <given-names>E.</given-names></name> <name><surname>Audic</surname> <given-names>S.</given-names></name> <name><surname>Vincent</surname> <given-names>F.</given-names></name> <name><surname>Veluchamy</surname> <given-names>A.</given-names></name> <name><surname>Poulain</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Insights into global diatom distribution and diversity in the world&#x2019;s ocean.</article-title> <source><italic>PNAS</italic></source> <volume>2016</volume> <fpage>E1516</fpage>&#x2013;<lpage>E1525</lpage>.</citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mohamed</surname> <given-names>Z. A.</given-names></name></person-group> (<year>2018</year>). <article-title>Potentially harmful microalgae and algal blooms in the Red Sea: Current knowledge and research needs.</article-title> <source><italic>Marine Environ. Res.</italic></source> <volume>140</volume> <fpage>234</fpage>&#x2013;<lpage>242</lpage>. <pub-id pub-id-type="doi">10.1016/j.marenvres.2018.06.019</pub-id> <pub-id pub-id-type="pmid">29970250</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nakov</surname> <given-names>T.</given-names></name> <name><surname>Beaulieu</surname> <given-names>J. M.</given-names></name> <name><surname>Alverson</surname> <given-names>A. J.</given-names></name></person-group> (<year>2018</year>). <article-title>Accelerated diversification is related to life history and locomotion in a hyperdiverse lineage of microbial eukaryotes (Diatoms, Bacillariophyta).</article-title> <source><italic>New Phytol.</italic></source> <volume>219</volume> <fpage>462</fpage>&#x2013;<lpage>473</lpage>. <pub-id pub-id-type="doi">10.1111/nph.15137</pub-id> <pub-id pub-id-type="pmid">29624698</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Roy</surname> <given-names>A. S.</given-names></name> <name><surname>Woehle</surname> <given-names>C.</given-names></name> <name><surname>LaRoche</surname> <given-names>J.</given-names></name></person-group> (<year>2020</year>). <article-title>The transfer of the ferredoxin gene from the chloroplast to the nuclear genome is ancient within the paraphyletic genus thalassiosira.</article-title> <source><italic>Front. Microbiol.</italic></source> <volume>11</volume>:<issue>523689</issue>. <pub-id pub-id-type="doi">10.3389/fmicb.2020.523689</pub-id> <pub-id pub-id-type="pmid">33123095</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rozas</surname> <given-names>J.</given-names></name> <name><surname>Ferrer-Mata</surname> <given-names>A.</given-names></name> <name><surname>S&#x00E1;nchez-DelBarrio</surname> <given-names>J. C.</given-names></name> <name><surname>Guirao-Rico</surname> <given-names>S.</given-names></name> <name><surname>Librado</surname> <given-names>P.</given-names></name> <name><surname>Ramos-Onsins</surname> <given-names>S. E.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>DnaSP 6: DNA sequence polymorphism analysis of large datasets.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>34</volume> <fpage>3299</fpage>&#x2013;<lpage>3302</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msx248</pub-id> <pub-id pub-id-type="pmid">29029172</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ruck</surname> <given-names>E. C.</given-names></name> <name><surname>Nakov</surname> <given-names>T.</given-names></name> <name><surname>Jansen</surname> <given-names>R. K.</given-names></name> <name><surname>Theriot</surname> <given-names>E. C.</given-names></name> <name><surname>Alverson</surname> <given-names>A. J.</given-names></name></person-group> (<year>2014</year>). <article-title>Serial gene losses and foreign DNA underlie size and sequence variation in the plastid genomes of diatoms.</article-title> <source><italic>Genome Biol. Evol.</italic></source> <volume>6</volume> <fpage>644</fpage>&#x2013;<lpage>654</lpage>. <pub-id pub-id-type="doi">10.1093/gbe/evu039</pub-id> <pub-id pub-id-type="pmid">24567305</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sabir</surname> <given-names>J. S.</given-names></name> <name><surname>Yu</surname> <given-names>M.</given-names></name> <name><surname>Ashworth</surname> <given-names>M. P.</given-names></name> <name><surname>Baeshen</surname> <given-names>N. A.</given-names></name> <name><surname>Baeshen</surname> <given-names>M. N.</given-names></name> <name><surname>Bahieldin</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Conserved gene order and expanded inverted repeats characterize plastid genomes of Thalassiosirales.</article-title> <source><italic>PLoS One</italic></source> <volume>9</volume>:<issue>e107854</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0107854</pub-id> <pub-id pub-id-type="pmid">25233465</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sarno</surname> <given-names>D.</given-names></name> <name><surname>Kooistra</surname> <given-names>W. H. C. F.</given-names></name> <name><surname>Medlin</surname> <given-names>L. K.</given-names></name> <name><surname>Percopo</surname> <given-names>I.</given-names></name> <name><surname>Zingone</surname> <given-names>A.</given-names></name></person-group> (<year>2005</year>). <article-title>Diversity in the genusskeletonema(bacillariophyceae). ii. an assessment of the taxonomy ofs. costatum-like species with the description of four new species.</article-title> <source><italic>J. Phycol.</italic></source> <volume>41</volume> <fpage>151</fpage>&#x2013;<lpage>176</lpage>. <pub-id pub-id-type="doi">10.1111/j.1529-8817.2005.04067.x</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sarno</surname> <given-names>D.</given-names></name> <name><surname>Kooistra</surname> <given-names>W.</given-names></name> <name><surname>Balzano</surname> <given-names>S.</given-names></name> <name><surname>Hargraves</surname> <given-names>P. E.</given-names></name> <name><surname>Zingone</surname> <given-names>A.</given-names></name></person-group> (<year>2007</year>). <article-title>Diversity in the genus Skeletonema (Bacillariophyceae): III. Phylogenetic position and morphological variability of Skeletonema costatum and Skeletonema grevillei, with the description of Skeletonema ardens sp nov.</article-title> <source><italic>J. Phycol.</italic></source> <volume>43</volume> <fpage>156</fpage>&#x2013;<lpage>170</lpage>. <pub-id pub-id-type="doi">10.1111/j.1529-8817.2006.00305.x</pub-id></citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shuya</surname> <given-names>L.</given-names></name> <name><surname>Nansheng</surname> <given-names>C.</given-names></name></person-group> (<year>2021</year>). <article-title>Advances in biodiversity analysis of phytoplankton and harmful algal bloom species in the Jiaozhou Bay (with English abstract).</article-title> <source><italic>Marine Sci.</italic></source> <volume>45</volume> <fpage>170</fpage>&#x2013;<lpage>188</lpage>.</citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Singh</surname> <given-names>V. K.</given-names></name> <name><surname>Mangalam</surname> <given-names>A. K.</given-names></name> <name><surname>Dwivedi</surname> <given-names>S.</given-names></name> <name><surname>Naik</surname> <given-names>S.</given-names></name></person-group> (<year>1998</year>). <article-title>Primer premier: Program for design of degenerate primers from a protein sequence.</article-title> <source><italic>Biotechniques</italic></source> <volume>24</volume> <fpage>318</fpage>&#x2013;<lpage>319</lpage>. <pub-id pub-id-type="doi">10.2144/98242pf02</pub-id> <pub-id pub-id-type="pmid">9494736</pub-id></citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Smith</surname> <given-names>S.</given-names></name> <name><surname>Dunn</surname> <given-names>C.</given-names></name></person-group> (<year>2008</year>). <article-title>Phyutility: a phyloinformatics tool for trees, alignments and molecular data.</article-title> <source><italic>Bioinformatics</italic></source> <volume>24</volume> <fpage>715</fpage>&#x2013;<lpage>716</lpage>.</citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Song</surname> <given-names>H.</given-names></name> <name><surname>Liu</surname> <given-names>F.</given-names></name> <name><surname>Li</surname> <given-names>Z.</given-names></name> <name><surname>Xu</surname> <given-names>Q.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name> <name><surname>Yu</surname> <given-names>Z.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Development of a high-resolution molecular marker for tracking Phaeocystis globosa genetic diversity through comparative analysis of chloroplast genomes.</article-title> <source><italic>Harmful Algae</italic></source> <volume>99</volume>:<issue>101911</issue>. <pub-id pub-id-type="doi">10.1016/j.hal.2020.101911</pub-id> <pub-id pub-id-type="pmid">33218437</pub-id></citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sorhannus</surname> <given-names>U.</given-names></name></person-group> (<year>2007</year>). <article-title>A nuclear-encoded small-subunit ribosomal RNA timescale for diatom evolution.</article-title> <source><italic>Marine Micropaleontol.</italic></source> <volume>65</volume> <fpage>1</fpage>&#x2013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.1016/j.marmicro.2007.05.002</pub-id></citation></ref>
<ref id="B56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Strzepek</surname> <given-names>R. F.</given-names></name> <name><surname>Harrison</surname> <given-names>P. J.</given-names></name></person-group> (<year>2004</year>). <article-title>Photosynthetic architecture differs in coastal and oceanic diatoms.</article-title> <source><italic>Nature</italic></source> <volume>431</volume> <fpage>689</fpage>&#x2013;<lpage>692</lpage>. <pub-id pub-id-type="doi">10.1038/nature02954</pub-id> <pub-id pub-id-type="pmid">15470428</pub-id></citation></ref>
<ref id="B57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Thorvaldsdottir</surname> <given-names>H.</given-names></name> <name><surname>Robinson</surname> <given-names>J. T.</given-names></name> <name><surname>Mesirov</surname> <given-names>J. P.</given-names></name></person-group> (<year>2013</year>). <article-title>Integrative Genomics Viewer (IGV): high-performance genomics data visualization and exploration.</article-title> <source><italic>Brief. Bioinform.</italic></source> <volume>14</volume> <fpage>178</fpage>&#x2013;<lpage>192</lpage>. <pub-id pub-id-type="doi">10.1093/bib/bbs017</pub-id> <pub-id pub-id-type="pmid">22517427</pub-id></citation></ref>
<ref id="B58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tillich</surname> <given-names>M.</given-names></name> <name><surname>Lehwark</surname> <given-names>P.</given-names></name> <name><surname>Pellizzer</surname> <given-names>T.</given-names></name> <name><surname>Ulbricht-Jones</surname> <given-names>E.</given-names></name> <name><surname>Fischer</surname> <given-names>A.</given-names></name> <name><surname>Bock</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>GeSeq &#x2013; versatile and accurate annotation of organelle genomes.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>45</volume> <fpage>W6</fpage>&#x2013;<lpage>W11</lpage>.</citation></ref>
<ref id="B59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Trifinopoulos</surname> <given-names>J.</given-names></name> <name><surname>Nguyen</surname> <given-names>L. T.</given-names></name> <name><surname>von Haeseler</surname> <given-names>A.</given-names></name> <name><surname>Minh</surname> <given-names>B. Q.</given-names></name></person-group> (<year>2016</year>). <article-title>W-IQ-TREE: a fast online phylogenetic tool for maximum likelihood analysis.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>44</volume> <fpage>W232</fpage>&#x2013;<lpage>W235</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw256</pub-id> <pub-id pub-id-type="pmid">27084950</pub-id></citation></ref>
<ref id="B60"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>D.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>Z.</given-names></name> <name><surname>Zhu</surname> <given-names>J.</given-names></name> <name><surname>Yu</surname> <given-names>J.</given-names></name></person-group> (<year>2010</year>). <article-title>KaKs_Calculator 2.0: a toolkit incorporating gamma-series methods and sliding window strategies.</article-title> <source><italic>Genomics Proteomics Bioinform.</italic></source> <volume>8</volume> <fpage>77</fpage>&#x2013;<lpage>80</lpage>. <pub-id pub-id-type="doi">10.1016/S1672-0229(10)60008-3</pub-id></citation></ref>
<ref id="B61"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>J.</given-names></name> <name><surname>Liu</surname> <given-names>F.</given-names></name> <name><surname>Chen</surname> <given-names>N.</given-names></name></person-group> (<year>2021</year>). <article-title>Mitochondrial genome of the harmful algal bloom species Odontella regia (Mediophyceae, Bacillariophyta).</article-title> <source><italic>J. Appl. Phycol.</italic></source> <volume>2021</volume>:<issue>23641</issue>. <pub-id pub-id-type="doi">10.1007/s10811-020-02364-1</pub-id></citation></ref>
<ref id="B62"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>C.</given-names></name> <name><surname>Dong</surname> <given-names>W.</given-names></name> <name><surname>Li</surname> <given-names>W.</given-names></name> <name><surname>Lu</surname> <given-names>Y.</given-names></name> <name><surname>Xie</surname> <given-names>X.</given-names></name> <name><surname>Jin</surname> <given-names>X.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Comparative analysis of six lagerstroemia complete chloroplast genomes.</article-title> <source><italic>Front. Plant Sci.</italic></source> <volume>8</volume>:<issue>15</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2017.00015</pub-id> <pub-id pub-id-type="pmid">28154574</pub-id></citation></ref>
<ref id="B63"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yamada</surname> <given-names>M.</given-names></name> <name><surname>Otsubo</surname> <given-names>M.</given-names></name> <name><surname>Tsutsumi</surname> <given-names>Y.</given-names></name> <name><surname>Mizota</surname> <given-names>C.</given-names></name> <name><surname>Nakamura</surname> <given-names>Y.</given-names></name> <name><surname>Takahashi</surname> <given-names>K.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Utility of mitochondrial-encoded cytochrome c oxidase I gene for phylogenetic analysis and species identification of the planktonic diatom genus <italic>Skeletonema</italic>.</article-title> <source><italic>Phycol. Res.</italic></source> <volume>65</volume> <fpage>217</fpage>&#x2013;<lpage>225</lpage>. <pub-id pub-id-type="doi">10.1111/pre.12179</pub-id></citation></ref>
<ref id="B64"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>Z. H.</given-names></name></person-group> (<year>2007</year>). <article-title>PAML 4: Phylogenetic analysis by maximum likelihood.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>24</volume> <fpage>1586</fpage>&#x2013;<lpage>1591</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msm088</pub-id> <pub-id pub-id-type="pmid">17483113</pub-id></citation></ref>
<ref id="B65"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>M.</given-names></name> <name><surname>Ashworth</surname> <given-names>M. P.</given-names></name> <name><surname>Hajrah</surname> <given-names>N. H.</given-names></name> <name><surname>Khiyami</surname> <given-names>M. A.</given-names></name> <name><surname>Sabir</surname> <given-names>M. J.</given-names></name> <name><surname>Alhebshi</surname> <given-names>A. M.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Evolution of the plastid genomes in diatoms.</article-title> <source><italic>Plastid. Genome Evol.</italic></source> <volume>85</volume> <fpage>129</fpage>&#x2013;<lpage>155</lpage>. <pub-id pub-id-type="doi">10.1016/bs.abr.2017.11.009</pub-id></citation></ref>
<ref id="B66"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>D.</given-names></name> <name><surname>Gao</surname> <given-names>F.</given-names></name> <name><surname>Jakovlic</surname> <given-names>I.</given-names></name> <name><surname>Zou</surname> <given-names>H.</given-names></name> <name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Li</surname> <given-names>W. X.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>PhyloSuite: An integrated and scalable desktop platform for streamlined molecular sequence data management and evolutionary phylogenetics studies.</article-title> <source><italic>Mol. Ecol. Res.</italic></source> <volume>20</volume> <fpage>348</fpage>&#x2013;<lpage>355</lpage>. <pub-id pub-id-type="doi">10.1111/1755-0998.13096</pub-id> <pub-id pub-id-type="pmid">31599058</pub-id></citation></ref>
</ref-list>
<fn-group>
<fn id="footnote1">
<label>1</label>
<p><ext-link ext-link-type="uri" xlink:href="https://github.com/BFL-lab/Mfannot">https://github.com/BFL-lab/Mfannot</ext-link></p></fn>
<fn id="footnote2">
<label>2</label>
<p><ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/orffinder/">https://www.ncbi.nlm.nih.gov/orffinder/</ext-link></p></fn>
<fn id="footnote3">
<label>3</label>
<p><ext-link ext-link-type="uri" xlink:href="http://tree.bio.ed.ac.uk/software/figtree/">http://tree.bio.ed.ac.uk/software/figtree/</ext-link></p></fn>
<fn id="footnote4">
<label>4</label>
<p><ext-link ext-link-type="uri" xlink:href="https://www.ebi.ac.uk/Tools/psa/genewise/">https://www.ebi.ac.uk/Tools/psa/genewise/</ext-link></p></fn>
</fn-group>
</back>
</article>