<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fgene.2021.635043</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>PacBio Single-Molecule Long-Read Sequencing Reveals Genes Tolerating Manganese Stress in <italic>Schima superba</italic> Saplings</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Liaquat</surname> <given-names>Fiza</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1162982/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Munis</surname> <given-names>Muhammad Farooq Hussain</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Arif</surname> <given-names>Samiah</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Haroon</surname> <given-names>Urooj</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Shi</surname> <given-names>Jianxin</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Saqib</surname> <given-names>Saddam</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Zaman</surname> <given-names>Wajid</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1025463/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Che</surname> <given-names>Shengquan</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Liu</surname> <given-names>Qunlu</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1153743/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>School of Agriculture and Biology, Shanghai Jiao Tong University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Plant Sciences, Faculty of Biological Sciences, Quaid-i-Azam University</institution>, <addr-line>Islamabad</addr-line>, <country>Pakistan</country></aff>
<aff id="aff3"><sup>3</sup><institution>Joint International Research Laboratory of Metabolic and Developmental Sciences, School of Life Sciences and Biotechnology, Shanghai Jiao Tong University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>State Key Laboratory of Systematic and Evolutionary Botany, Institute of Botany, Chinese Academy of Sciences</institution>, <addr-line>Beijing</addr-line>, <country>China</country></aff>
<aff id="aff5"><sup>5</sup><institution>University of Chinese Academy of Sciences</institution>, <addr-line>Beijing</addr-line>, <country>China</country></aff>
<aff id="aff6"><sup>6</sup><institution>Department of Landscape Architecture, School of Design, Shanghai Jiao Tong University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Reyazul Rouf Mir, Sher-e-Kashmir University of Agricultural Sciences and Technology, India</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Jianguo Gao, Peking University, China; Sunera Khan, Abdul Wali Khan University Mardan, Pakistan; Muhammad Aaqil Khan, Kyungpook National University, South Korea</p></fn>
<corresp id="c001">&#x002A;Correspondence: Qunlu Liu, <email>liuql@sjtu.edu.cn</email></corresp>
<fn fn-type="other" id="fn004"><p>This article was submitted to Plant Genomics, a section of the journal Frontiers in Genetics</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>06</day>
<month>04</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>12</volume>
<elocation-id>635043</elocation-id>
<history>
<date date-type="received">
<day>29</day>
<month>11</month>
<year>2020</year>
</date>
<date date-type="accepted">
<day>01</day>
<month>03</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2021 Liaquat, Munis, Arif, Haroon, Shi, Saqib, Zaman, Che and Liu.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Liaquat, Munis, Arif, Haroon, Shi, Saqib, Zaman, Che and Liu</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p><italic>Schima superba</italic> (Theaceae) is a subtropical evergreen tree and is used widely for forest firebreaks and gardening. It is a plant that tolerates salt and typically accumulates elevated amounts of manganese in the leaves. With large ecological amplitude, this tree species grows quickly. Due to its substantial biomass, it has a great potential for soil remediation. To evaluate the thorough framework of the mRNA, we employed PacBio sequencing technology for the first time to generate <italic>S. Superba</italic> transcriptome. In this analysis, overall, 511,759 full length non-chimeric reads were acquired, and 163,834 high-quality full-length reads were obtained. Overall, 93,362 open reading frames were obtained, of which 78,255 were complete. In gene annotation analyses, the Kyoto Encyclopedia of Genes and Genomes (KEGG), Clusters of Orthologous Genes (COG), Gene Ontology (GO), and Non-Redundant (Nr) databases were allocated 91,082, 71,839, 38,914, and 38,376 transcripts, respectively. To identify long non-coding RNAs (lncRNAs), we utilized four computational methods associated with protein families (Pfam), Cooperative Data Classification (CPC), Coding Assessing Potential Tool (CPAT), and Coding Non-Coding Index (CNCI) databases and observed 8,551, 9,174, 20,720, and 18,669 lncRNAs, respectively. Moreover, nine genes were randomly selected for the expression analysis, which showed the highest expression of Gene 6 (Na_Ca_ex gene), and CAX (CAX-interacting protein 4) was higher in manganese (Mn)-treated group. This work provided significant number of full-length transcripts and refined the annotation of the reference genome, which will ease advanced genetic analyses of <italic>S. superba.</italic></p>
</abstract>
<kwd-group>
<kwd><italic>Schima superba</italic></kwd>
<kwd>manganese</kwd>
<kwd>transcriptome</kwd>
<kwd>full-length transcript</kwd>
<kwd>alternative splicing</kwd>
</kwd-group>
<counts>
<fig-count count="8"/>
<table-count count="6"/>
<equation-count count="0"/>
<ref-count count="36"/>
<page-count count="10"/>
<word-count count="0"/>
</counts>
</article-meta>
</front>
<body>
<sec id="S1">
<title>Introduction</title>
<p><italic>Schima superba</italic> is naturally grown in mining areas and abundantly absorbs different metals, particularly manganese (Mn). Due to this absorbance ability, this tree is being used as phytoremediation agent in metal toxic soils (<xref ref-type="bibr" rid="B32">Yang et al., 2008</xref>). This tree belongs to the family Theaceae, and it is commonly used for gardening and forest firebreak. Characteristically, the leaves of this tree contain an unusual high concentration of Mn (<xref ref-type="bibr" rid="B33">Yang et al., 2021</xref>).</p>
<p>Hyper-accumulation of harmful metals in different plants helps in cleaning or decontaminating soils. Contamination of metals in the soil can be reduced through plants&#x2019; absorbance and transportation, which is a kind of green environmental remediation technology (<xref ref-type="bibr" rid="B19">Padmavathiamma and Li, 2007</xref>). Woody plants have high biomass and long-life cycle, and those are unique advantages in the phytoremediation of heavy metal. But the competency of woody trees to accumulate heavy metals is usually very low, and most of heavy metals are accumulated in the roots of woody trees (<xref ref-type="bibr" rid="B4">Capuana, 2020</xref>). As reported by <xref ref-type="bibr" rid="B2">Baker and Brooks (1989)</xref>, more than 10,000 mg/kg concentrations of Mn in above ground tissues of plants are considered as the hyper-accumulation of Mn. Along with having a potential to accumulate Mn, <italic>S. superba</italic> has vast ecological amplitude, dominant canopy species (<xref ref-type="bibr" rid="B26">Tang et al., 2020</xref>) and has considerable biomass, which suggests its potential use in the soil remediation (<xref ref-type="bibr" rid="B18">Luo et al., 2006</xref>).</p>
<p>Although, researchers have reported the hyper-accumulation of Mn in leaves, roots, and shoots, no study has performed the transcriptomic analysis of <italic>S. superba</italic> till date. Since the establishment of large-scale sequencing technology, transcript sequences have become a significant source of studying gene expression and regulation (<xref ref-type="bibr" rid="B16">Levy and Myers, 2016</xref>). The restriction of sequencing read length in the second-generation, the full-length record acquired by splicing is not finished, and the third-generation sequencing technology signified by Pacific Biosciences (PacBio) has successfully overcome this issue (<xref ref-type="bibr" rid="B13">Jiao and Schneeberger, 2017</xref>; <xref ref-type="bibr" rid="B24">Slatko et al., 2018</xref>). Based on its long-read length, high-quality full-length record can be legitimately acquired to distinguish simple sequence repeat (SSR), fulfill functional annotation of transcripts, and lncRNA (<xref ref-type="bibr" rid="B28">Wang et al., 2015</xref>; <xref ref-type="bibr" rid="B31">Xie et al., 2020</xref>). Transcriptomics provides information of the complete set of RNA transcripts in a specific tissue or cell under different developmental or physiological stages, involving ribosomal RNA, transfer RNA, messenger RNA, and non-coding RNAs. Moreover, it concentrates on the gene expression, gene structure, and function at RNA level that help to reveal the molecular processes involved in various biological mechanisms (<xref ref-type="bibr" rid="B10">Dong and Chen, 2013</xref>).</p>
<p>In this research, a single molecule real-time sequencing (SMRT) has been completed to get the full-length transcriptome of <italic>S. superba</italic>. Utilizing the transcriptome data functional annotations of transcripts, transcriptional factors (TFs) analysis, prediction of lnRNA, and basic sequence repeat (SSR) analysis were performed. In addition, the expression pattern of various genes provides basic understanding of transcriptional regulation of <italic>S. superba</italic>. This study will not only assist future functional genomics research but also provide an avenue for further selective genetic engineering and breeding projects of <italic>S. superba</italic>.</p>
</sec>
<sec id="S2" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec id="S2.SS1">
<title>Pot Experiment and Sample Collection</title>
<p>A pot test was carried out in the glasshouse of Shanghai Jiao Tong University, China, by using 1-year-old <italic>S. superba</italic> saplings. For this purpose, 18 saplings, with same growth potential (about 35 cm high), were taken and randomly allocated into two groups: control (CK) and Mn concentration 100 mM (WT), in three replicates. Plant tissues were collected after 1, 5, and 10 days of transplantation in quarter-strength of Hoagland solution. The tissues were collected in liquid nitrogen and processed through the isolation of RNA at &#x2212;80&#x00B0;C.</p>
</sec>
<sec id="S2.SS2">
<title>RNA Extraction</title>
<p>RNA extraction from the collected plant samples (0.2 g leaves) was performed with the RNeasy plus Mini Kit (Qiagen, Valencia, United States). Using the Nano drop ND-1000 (Nano drop Technologies, Rockland, DE, United States) spectrophotometer, its quality and quantity were calculated after observing RNA on agarose gel. By using Qubit<sup>&#x00AE;</sup> RNA Assay Kit and RNA Nano 6000 Assay Kit, RNA quality has been identified clearly.</p>
</sec>
<sec id="S2.SS3">
<title>Library Construction and SMRT Sequencing</title>
<p>For sequencing, C2 sequencing reagents were used in Pacific Biosciences (PacBio) real-time sequencer. Purified RNA was utilized for synthesizing cDNA by SMRT PCR cDNA Synthesis Kit (Clontech, CA, United States). Full-length cDNA of different sizes was selected and cDNA libraries were constructed using the BluePippin<sup>&#x00AE;</sup> (SageScience, Beverly, MA, United States). After BluePippin screening, the fragments were pacified to large-scale PCR to get sufficient total cDNA and evaluate using Qubit fluorometer (Life Technologies, Carlsbad, CA, United States). The libraries&#x2019; uniqueness was maintained by using Agilent Bio analyzer 2100 system and SMRT sequencing was achieved.</p>
</sec>
<sec id="S2.SS4">
<title>Error Correction and Quality Filtering</title>
<p>Sequence statistics were obtained by using the SMRT link 5.1 software. Relevant parameters such as no-polish TRUE, min-length 50, max-drop-fraction 0.8, min-predicted-accuracy 0.8, min-passes 2, min-z score -9999.0, and max-length 15000 were followed to produce CCS by subreading BAM files. The output was CCS.BAM files, which, using pbclassify.py, were categorized into full length and non-full length reads. Full and non-full length FASTA files were fed into the cluster stage, and additional nucleotide errors were corrected by LoRDEC software in the consensus readings. Unnecessary data in the corrected consensus reads were separated using CD-HIT (-c 0.95 -T 6 -G 0 -aL 0.00 -aS 0.99) to acquire final transcripts for the subsequent investigation.</p>
</sec>
<sec id="S2.SS5">
<title>Functional Annotation of Transcripts</title>
<p>We recognized functional annotations matching by searching to the non-redundant nucleotide database (Nr), Swiss-Prot, Pfam, non-supervised orthologous groups egg (NOG), clusters of orthologous groups (COG), eukaryotic orthologous groups (KOG), Gene Ontology (GO), Kyoto Encyclopedia of Genes and Genomes (KEGG), and BLAST alignment databases, and all transcript sequences were examined for homology (<xref ref-type="bibr" rid="B1">Bairoch and Apweiler, 2000</xref>; <xref ref-type="bibr" rid="B17">Li et al., 2002</xref>; <xref ref-type="bibr" rid="B27">Tatusov et al., 2003</xref>; <xref ref-type="bibr" rid="B14">Kanehisa et al., 2004</xref>).</p>
</sec>
<sec id="S2.SS6">
<title>Identification of TFs, lncRNAs, and SSR</title>
<p>Plant transcription factors were predicted using iTAK v1.7a (<xref ref-type="bibr" rid="B35">Zheng et al., 2016</xref>). Four tools, CNCIv2 (<xref ref-type="bibr" rid="B25">Sun et al., 2013</xref>), CPCvcpc-0.9-r2 with e-value &#x201C;1e-10&#x201D; (<xref ref-type="bibr" rid="B15">Kong et al., 2007</xref>), Pfam-scan (E 0.001 -domE 0.001) (<xref ref-type="bibr" rid="B12">Finn et al., 2016</xref>) and PLEKv1.2 with min length 200 (<xref ref-type="bibr" rid="B17">Li et al., 2002</xref>) were chosen to predict candidate lncRNAs. Transcripts predicted with coding capacity by all of the mentioned above tools were separated out, and those without coding prospective were considered as candidate set of lncRNAs.</p>
</sec>
<sec id="S2.SS7">
<title>Development of SSR Markers</title>
<p>Simple sequence repeats were identified by MISA v1.0<sup><xref ref-type="fn" rid="footnote1">1</xref></sup> (<xref ref-type="bibr" rid="B3">Beier et al., 2017</xref>), with default parameters. MISA can recognize seven types of SSR, namely mono, di, tri, tetra, penta, and hexa nucleotide by analyzing transcript sequences. By using tool Batch primer 3, SSR primers were designed. DNA was extracted from <italic>S. superba</italic> for PCR amplification, and the product was extracted in 8% polyacrylamide gel.</p>
</sec>
<sec id="S2.SS8">
<title>qRT-PCR Analysis</title>
<p>All 36 saplings of control group (CK) and Mn-treated group (WT) were utilized by RNA extraction via RNeasy plus Mini Kit (Qiagen, Valencia, United States). The cDNA was synthesized using SMRT PCR cDNA synthesis kit (Clontech, United States). The qRT PCR was performed to see the expression of nine different transporter genes (<xref ref-type="supplementary-material" rid="DS5">Supplementary Table S5</xref>). The reaction mixture consisted of 7.8 &#x03BC;l of cDNA and 10 &#x03BC;l of 2&#x00D7; qPCR. The process involve initial denaturation at 95&#x00B0;C for 10 min, which is followed by 45 cycles of denaturation at 95&#x00B0;C for 15 s, while annealing and extension at 60&#x00B0;C for 60 1 min.</p>
</sec>
</sec>
<sec id="S3">
<title>Results</title>
<sec id="S3.SS1">
<title>SMRT Sequencing Data of <italic>S. superba</italic></title>
<p>Plant tissues were used for RNA extraction and library construction of cDNA. After removing adaptor sequences, a total of 1,311,552,27 low-quality sequences were obtained. It comprised of 1&#x2013;6 kb data. After self-correction of subread sequences (with minPasses = 39), overall 588,479 circular consensus sequence (CCS) were obtained. Moreover, 511,759 full-length non-chimeric (FLNC) picks were also identified. Iterative sequence clustering revealed 167,782 consensus isoforms, with a mean read length of 2187 bp. Together with non-FL sequence, the Quiver program corrected the consistent sequence in each cluster, yielding 163834 high-quality transcripts (high- quality isoforms) with more than 97.65% accuracy. In addition, the low-quality record was corrected with the corresponding sequencing data to enhance the accuracy of the isoforms. Finally, using CD HIT (3.3) tools, 97,520 bar non-redundant transcript sequences were obtained (<xref ref-type="table" rid="T1">Tables 1</xref>, <xref ref-type="table" rid="T2">2</xref> and <xref ref-type="fig" rid="F1">Figure 1</xref>).</p>
<table-wrap position="float" id="T1">
<label>TABLE 1</label>
<caption><p>Sequencing data statistics table.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Sample name</td>
<td valign="top" align="center">Sample ID</td>
<td valign="top" align="center">cDNA size</td>
<td valign="top" align="center">SMRT cells</td>
<td valign="top" align="center">Data size</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left"><italic>Schima superba</italic></td>
<td valign="top" align="center">F01</td>
<td valign="top" align="center">1&#x2013;6 k</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">40 G</td>
</tr>
</tbody>
</table></table-wrap>
<table-wrap position="float" id="T2">
<label>TABLE 2</label>
<caption><p>Reads summary insert from single molecule long-read sequencing.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Samples</td>
<td valign="top" align="center">cDNA size</td>
<td valign="top" align="center">CCS no.</td>
<td valign="top" align="center">Read bases of CCS</td>
<td valign="top" align="center">Mean read length</td>
<td valign="top" align="center">Mean no. of passes</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">F01</td>
<td valign="top" align="center">1&#x2013;6 k</td>
<td valign="top" align="center">588,479</td>
<td valign="top" align="center">1,311,552,271</td>
<td valign="top" align="center">2,228</td>
<td valign="top" align="center">39</td>
</tr>
<tr>
<td valign="top" align="left">F02</td>
<td valign="top" align="center">All</td>
<td valign="top" align="center">588,479</td>
<td valign="top" align="center">1,311,552,271</td>
<td valign="top" align="center">2,228</td>
<td valign="top" align="center">39</td>
</tr>
</tbody>
</table></table-wrap>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Length distribution of full-length non-chimeric sequence.</p></caption>
<graphic xlink:href="fgene-12-635043-g001.tif"/>
</fig>
</sec>
<sec id="S4">
<title>Open Reading Frame and AS Event Prediction</title>
<p>About 93,362 ORFs were predicted using Trans Decoder software. Overall, 78,255 complete ORFs were recognized, and the complete ORFs were successfully analyzed for length distribution (<xref ref-type="fig" rid="F2">Figure 2</xref>); 7,489 AS events were revealed out of all transcripts obtained by SMRT sequencing (<xref ref-type="supplementary-material" rid="DS1">Supplementary Table S1</xref>). Owing to the lack of an unavailable <italic>S. Superba</italic> reference genome, the classification of the forms of AS events in future research would be justified (<xref ref-type="fig" rid="F2">Figure 2</xref>).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Division of predicted CDS-encoded protein length.</p></caption>
<graphic xlink:href="fgene-12-635043-g002.tif"/>
</fig>
</sec>
<sec id="S4.SS1">
<title>Long Non-coding RNA Identification</title>
<p>These are a group of non-coding poly-A RNAs that are involved in growth and stress response of the plant. In this work, we utilize four computational methods to recognize lncRNAs, associated with Pfam, CPC, CPAT, and CNCI databases. Overall, 8,551, 9,174, 20,720, and 18,669 lncRNAs were recognized in the Pfam, CPC, CPAT, and CNCI, respectively (<xref ref-type="supplementary-material" rid="DS2">Supplementary Table S2</xref>). By filtering the record of less than 300 bp, 2,011 transcripts were examined as lncRNAs by all four mechanisms (<xref ref-type="fig" rid="F3">Figure 3</xref>).</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>LncRNAs predicted by the CNCI, CPAT, Pfam, and CPC protein structure domain analysis.</p></caption>
<graphic xlink:href="fgene-12-635043-g003.tif"/>
</fig>
</sec>
<sec id="S4.SS2">
<title>Transcription Factor Prediction</title>
<p>These are the key regulators of gene expression and play a significant role in plant growth and development. In this study, TFs are divided into 64 families, and 9423 putative TFs were identified (<xref ref-type="supplementary-material" rid="DS3">Supplementary Table S3</xref>). TFs in <italic>S. superba</italic> transcriptome were mostly related to the RLK-Pelle-DLS (473,5.02%), bHLH (278,2.95%), MYB-related (230,2.44%), CAMK-CDPK (218,2.31%), C2H2 (218,2.31%), C3H (202,2.14%), RWP-RK (189,2.01%), bZIP (177,1.88%), TKL-PI-4 (159,1.69%), and NAC (152,1.61%) families (<xref ref-type="fig" rid="F4">Figure 4</xref>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>Distribution of transcription factor types.</p></caption>
<graphic xlink:href="fgene-12-635043-g004.tif"/>
</fig>
</sec>
<sec id="S4.SS3">
<title>Functional Annotation of Transcripts</title>
<p>All 16,3834 unique SMRT transcripts were practically annotated by seven data storage, such as GO, KOG, Pfam, Swiss-Prot, COG, Nr, and KEGG using BLAST (7) software [version 2.2.26] (<xref ref-type="table" rid="T3">Table 3</xref>). By comparing the transcript sequence to NR with homologous species, 68,630 genes were annotated (<xref ref-type="fig" rid="F5">Figure 5</xref>).</p>
<table-wrap position="float" id="T3">
<label>TABLE 3</label>
<caption><p>Functional annotation of <italic>S. superba</italic> transcriptome.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Annotated databases</td>
<td valign="top" align="center">Isoform number</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">COG</td>
<td valign="top" align="center">38,914</td>
</tr>
<tr>
<td valign="top" align="left">GO</td>
<td valign="top" align="center">71,839</td>
</tr>
<tr>
<td valign="top" align="left">KEGG</td>
<td valign="top" align="center">38,376</td>
</tr>
<tr>
<td valign="top" align="left">KOG</td>
<td valign="top" align="center">58,193</td>
</tr>
<tr>
<td valign="top" align="left">PfAM</td>
<td valign="top" align="center">73,647</td>
</tr>
<tr>
<td valign="top" align="left">Eggnog</td>
<td valign="top" align="center">89,727</td>
</tr>
<tr>
<td valign="top" align="left">Swiss-Prot</td>
<td valign="top" align="center">66,790</td>
</tr>
<tr>
<td valign="top" align="left">Nr</td>
<td valign="top" align="center">91,082</td>
</tr>
<tr>
<td valign="top" align="left">All</td>
<td valign="top" align="center">91,617</td>
</tr>
</tbody>
</table></table-wrap>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>Species distribution of <italic>S. superba</italic> transcriptome annotated in the Nr database.</p></caption>
<graphic xlink:href="fgene-12-635043-g005.tif"/>
</fig>
</sec>
<sec id="S4.SS4">
<title>GO Classified Transcripts</title>
<p>Transcripts GO classification statistics demonstrated 71,839 unique genes, which were enriched in major categories of molecular function, cellular component, biological component, and catalytic activity (<xref ref-type="fig" rid="F3">Figures 3</xref>, <xref ref-type="fig" rid="F5">5</xref>). This analysis also helped us to get transcripts COG classification statistics (<xref ref-type="fig" rid="F6">Figure 6</xref>).</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption><p>Transcript GO annotation classification statistics graph.</p></caption>
<graphic xlink:href="fgene-12-635043-g006.tif"/>
</fig>
</sec>
<sec id="S4.SS5">
<title>COG Classification</title>
<p>To examine the functional annotation and classification of <italic>S. Superba</italic> for further study, all the transcripts were checked against the COG database clusters<sup><xref ref-type="fn" rid="footnote2">2</xref></sup>. This investigation indicated that 38,914 transcripts were allocated into 24 categories (<xref ref-type="fig" rid="F7">Figure 7</xref>). The highest group was general function prediction only (4,690, 11.1%), followed by signal transduction (4,291, 10.15%) whereas carbohydrate transport and metabolism was 3,981, 9.42%. Our results revealed six groups percentage were less than 1.00%, i.e., nuclear structure and modification, chromatin structure and dynamics including extracellular structure (<xref ref-type="fig" rid="F7">Figure 7</xref>).</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption><p>COG annotation classification statistics of transcripts.</p></caption>
<graphic xlink:href="fgene-12-635043-g007.tif"/>
</fig>
</sec>
<sec id="S4.SS6">
<title>KEGG Annotated Transcripts</title>
<p>KEGG data storage interpreted a total of 67,426 sequences and plotted 367 operative categories in <italic>S. superba</italic>. Among them, metabolism was the largest category. The functional annotations of all 78,559 unique transcripts were detected in this work (<xref ref-type="supplementary-material" rid="DS4">Supplementary Table S4</xref>). A significant number of genes, especially interrelated in salt-tolerance and fatty acid component of <italic>S. superba</italic> were annotated, such as oxidative phosphorylation (1073), plant hormone signal transduction (506), fatty acid biosynthesis (246), biosynthesis of unsaturated fatty acids (94), and &#x03B1;-linolenic acid metabolism (199). We also recognized matches to our unique transcripts in clusters of orthologous class of proteins (COG) (44,376, 56.49%), Pfam database (41,535, 52.87%), and Swiss-Prot (58,535, 74.51%) (<xref ref-type="table" rid="T4">Table 4</xref>).</p>
<table-wrap position="float" id="T4">
<label>TABLE 4</label>
<caption><p>Topmost pathways annotated by the KEGG database.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">No.</td>
<td valign="top" align="left">Name of pathways</td>
<td valign="top" align="center">Pathway ID</td>
<td valign="top" align="center">Transcripts (%)</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">1.</td>
<td valign="top" align="left">Carbon metabolism</td>
<td valign="top" align="center">ko01200</td>
<td valign="top" align="center">886(9.68%)</td>
</tr>
<tr>
<td valign="top" align="left">2.</td>
<td valign="top" align="left">Protein of processing in endoplasmic reticulum</td>
<td valign="top" align="center">Ko04141</td>
<td valign="top" align="center">462 (5.05%)</td>
</tr>
<tr>
<td valign="top" align="left">3.</td>
<td valign="top" align="left">Biosynthesis of amino acid</td>
<td valign="top" align="center">ko01230</td>
<td valign="top" align="center">621 (6.79%)</td>
</tr>
<tr>
<td valign="top" align="left">4.</td>
<td valign="top" align="left">Spliceosome</td>
<td valign="top" align="center">ko03040</td>
<td valign="top" align="center">520 (5.68%)</td>
</tr>
<tr>
<td valign="top" align="left">5.</td>
<td valign="top" align="left">Ribosome</td>
<td valign="top" align="center">ko03010</td>
<td valign="top" align="center">332 (3.63%)</td>
</tr>
<tr>
<td valign="top" align="left">6.</td>
<td valign="top" align="left">RNA transport</td>
<td valign="top" align="center">ko03013</td>
<td valign="top" align="center">356 (3.89%)</td>
</tr>
<tr>
<td valign="top" align="left">7.</td>
<td valign="top" align="left">Sucrose and starch metabolism</td>
<td valign="top" align="center">ko00500</td>
<td valign="top" align="center">384 (4.20%)</td>
</tr>
<tr>
<td valign="top" align="left">8.</td>
<td valign="top" align="left">Plant hormone signal transduction</td>
<td valign="top" align="center">ko04075</td>
<td valign="top" align="center">401 (4.38%)</td>
</tr>
<tr>
<td valign="top" align="left">9.</td>
<td valign="top" align="left">Oxidative phosphorylation</td>
<td valign="top" align="center">ko00190</td>
<td valign="top" align="center">240 (2.62%)</td>
</tr>
<tr>
<td valign="top" align="left">10.</td>
<td valign="top" align="left">Glycolysis/gluconeogenesis</td>
<td valign="top" align="center">ko00010</td>
<td valign="top" align="center">350 (3.82%)</td>
</tr>
<tr>
<td valign="top" align="left">11.</td>
<td valign="top" align="left">Plant pathogen interaction</td>
<td valign="top" align="center">ko04626</td>
<td valign="top" align="center">388 (4.24%)</td>
</tr>
<tr>
<td valign="top" align="left">12.</td>
<td valign="top" align="left">mRNA surveillance pathway</td>
<td valign="top" align="center">ko03015</td>
<td valign="top" align="center">339 (3.7%)</td>
</tr>
<tr>
<td valign="top" align="left">13.</td>
<td valign="top" align="left">Ubiquitin mediated proteolysis</td>
<td valign="top" align="center">ko04120</td>
<td valign="top" align="center">253 (2.76%)</td>
</tr>
<tr>
<td valign="top" align="left">14.</td>
<td valign="top" align="left">Amino sugar and nucleotide sugar metabolism</td>
<td valign="top" align="center">ko00520</td>
<td valign="top" align="center">245 (2.68%)</td>
</tr>
<tr>
<td valign="top" align="left">15.</td>
<td valign="top" align="left">Endocytosis</td>
<td valign="top" align="center">ko04144</td>
<td valign="top" align="center">270 (2.95%)</td>
</tr>
</tbody>
</table></table-wrap>
</sec>
<sec id="S4.SS7">
<title>Analysis of Gene Expression in qRT PCR</title>
<p>For the expression analysis of potential high expression genes, nine transporter genes were selected randomly for qRT PCR. Results of qRT PCR analysis showed the highest expression by Gene 6 (Na_Ca_ex), in Mn-treated group (WT) on day 1, 5, and 10, while the expression of CAX (CAX-interacting protein 4) was higher in Mn-treated group (WT) at day 5 (<xref ref-type="fig" rid="F8">Figure 8</xref>).</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption><p>Expression of genes in control group (CK) and Mn-treated group (WT) at day 1, day 5, and day 10. Error bars represent the standard deviation.</p></caption>
<graphic xlink:href="fgene-12-635043-g008.tif"/>
</fig>
</sec>
<sec id="S4.SS8">
<title>SSR Identification</title>
<p>After the screening of 95,258 obtained transcripts, about 58,396 possible SSRs were recognized from 29,075 transcripts. Among them 26,312 composed one SSR, and 19,007 contained two loci or more. In addition, 29,075 and 18,324 transcripts contained one SSR and at least two SSRs, respectively. Whereas observed compound formations were 18,324 SSRs. As shown in <xref ref-type="table" rid="T5">Table 5</xref>, the number of mono-, di-, tri-, tetra-, penta-, and hexa-nucleotide repeats were 44,045, 51,716, 14,521, 1,675, 753, and 988, accordingly. SSRs with 10 repeat units (16949, 14.9%) were the most abundant, followed by those with 6 (12563, 11%), 11 (10564, 9.2%), and 7 (7995, 87.03%) (<xref ref-type="table" rid="T6">Table 6</xref>).</p>
<table-wrap position="float" id="T5">
<label>TABLE 5</label>
<caption><p>Summary of SSR identified in <italic>Schima superba.</italic></p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Searching item</td>
<td valign="top" align="center">Numbers</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Total no. of sequence examined</td>
<td valign="top" align="center">95,258</td>
</tr>
<tr>
<td valign="top" align="left">Total size of examined sequences (bp)</td>
<td valign="top" align="center">225,274,809</td>
</tr>
<tr>
<td valign="top" align="left">No. of SSR containing sequences</td>
<td valign="top" align="center">58,396</td>
</tr>
<tr>
<td valign="top" align="left">No. of sequences containing more than one SSR</td>
<td valign="top" align="center">29,075</td>
</tr>
<tr>
<td valign="top" align="left">No. of SSRs present in compound formation</td>
<td valign="top" align="center">18,324</td>
</tr>
<tr>
<td valign="top" align="left">Mono-nucleotide</td>
<td valign="top" align="center">44,045</td>
</tr>
<tr>
<td valign="top" align="left">Di-nucleotide</td>
<td valign="top" align="center">51,716</td>
</tr>
<tr>
<td valign="top" align="left">Tri-nucleotide</td>
<td valign="top" align="center">14,521</td>
</tr>
<tr>
<td valign="top" align="left">Tetra-nucleotide</td>
<td valign="top" align="center">1,675</td>
</tr>
<tr>
<td valign="top" align="left">Penta-nucleotide</td>
<td valign="top" align="center">753</td>
</tr>
<tr>
<td valign="top" align="left">Hexa-nucleotide</td>
<td valign="top" align="center">988</td>
</tr>
</tbody>
</table></table-wrap>
<table-wrap position="float" id="T6">
<label>TABLE 6</label>
<caption><p>SSRs distribution based on the number of repeat units.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">No. of repeat units</td>
<td valign="top" align="center">Mono</td>
<td valign="top" align="center">Di</td>
<td valign="top" align="center">Tri</td>
<td valign="top" align="center">Tetra</td>
<td valign="top" align="center">Penta</td>
<td valign="top" align="center">Hexa</td>
<td valign="top" align="center">Total</td>
<td valign="top" align="center">Percentage</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">5</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">6914</td>
<td valign="top" align="center">1146</td>
<td valign="top" align="center">573</td>
<td valign="top" align="center">763</td>
<td valign="top" align="center">9396</td>
<td valign="top" align="center">8.263997608</td>
</tr>
<tr>
<td valign="top" align="left">6</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">8785</td>
<td valign="top" align="center">3099</td>
<td valign="top" align="center">353</td>
<td valign="top" align="center">150</td>
<td valign="top" align="center">176</td>
<td valign="top" align="center">12563</td>
<td valign="top" align="center">11.04944678</td>
</tr>
<tr>
<td valign="top" align="left">7</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">6163</td>
<td valign="top" align="center">1661</td>
<td valign="top" align="center">113</td>
<td valign="top" align="center">26</td>
<td valign="top" align="center">32</td>
<td valign="top" align="center">7995</td>
<td valign="top" align="center">7.031785959</td>
</tr>
<tr>
<td valign="top" align="left">8</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">5669</td>
<td valign="top" align="center">977</td>
<td valign="top" align="center">44</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">15</td>
<td valign="top" align="center">6708</td>
<td valign="top" align="center">5.899839927</td>
</tr>
<tr>
<td valign="top" align="left">9</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">5588</td>
<td valign="top" align="center">734</td>
<td valign="top" align="center">17</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">6339</td>
<td valign="top" align="center">5.575295959</td>
</tr>
<tr>
<td valign="top" align="left">10</td>
<td valign="top" align="center">11953</td>
<td valign="top" align="center">4542</td>
<td valign="top" align="center">452</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">16949</td>
<td valign="top" align="center">14.90703442</td>
</tr>
<tr>
<td valign="top" align="left">11</td>
<td valign="top" align="center">7151</td>
<td valign="top" align="center">3099</td>
<td valign="top" align="center">314</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">10564</td>
<td valign="top" align="center">9.29128041</td>
</tr>
<tr>
<td valign="top" align="left">12</td>
<td valign="top" align="center">5263</td>
<td valign="top" align="center">2203</td>
<td valign="top" align="center">178</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">7644</td>
<td valign="top" align="center">6.723073405</td>
</tr>
<tr>
<td valign="top" align="left">13</td>
<td valign="top" align="center">3813</td>
<td valign="top" align="center">2115</td>
<td valign="top" align="center">82</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">6010</td>
<td valign="top" align="center">5.28593291</td>
</tr>
<tr>
<td valign="top" align="left">14</td>
<td valign="top" align="center">3294</td>
<td valign="top" align="center">2111</td>
<td valign="top" align="center">45</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">5450</td>
<td valign="top" align="center">4.79340006</td>
</tr>
<tr>
<td valign="top" align="left">&#x2265;15</td>
<td valign="top" align="center">12571</td>
<td valign="top" align="center">11441</td>
<td valign="top" align="center">65</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">24080</td>
<td valign="top" align="center">21.17891256</td>
</tr>
</tbody>
</table></table-wrap>
</sec>
<sec id="S4.SS9">
<title>Development of SSR Markers</title>
<p>By using Primer 3.0 software, 95,374 pair of primers were designed, and among them, 200 were randomly selected for PCR (<xref ref-type="supplementary-material" rid="DS6">Supplementary Table S6</xref>). The product of 180 PCR pairs was examined successfully, with an efficiency rate of 90%. However, the remaining 20 pairs of primer failed to amplify at various annealing temperatures.</p>
</sec>
</sec>
<sec id="S5">
<title>Discussion</title>
<p>Since the development of high-throughput sequencing technology, transcriptomic analysis has become a valuable technology to study gene expression and regulation (<xref ref-type="bibr" rid="B28">Wang et al., 2015</xref>; <xref ref-type="bibr" rid="B8">Dharshini et al., 2016</xref>). However, due to read length limitation of the second-generation sequencing in different organisms, the full-length transcript obtained by splicing is not complete (<xref ref-type="bibr" rid="B22">Rhoads and Au, 2015</xref>). SMRT sequencing technology effectively solves this problem. This study is the first transcriptome analysis of <italic>S. superba</italic> using SMRT sequencing technology. The sequencing peaks were gained from leaf samples using the Pacific Biosciences Iso-Seq platform. After sequencing, 511,759 full-length non-chimerics (FLNC) were identified. Previous studies also reported similar results that newly discovered transcripts by SMRT in red clover and wheat were 45 bp longer than the known transcripts (<xref ref-type="bibr" rid="B9">Dong et al., 2015</xref>; <xref ref-type="bibr" rid="B5">Chao et al., 2018</xref>). Subsequently, our results also showed that the SMRT technology is very efficient for full-length cDNA sequencing and provided a rich resource for further functional genomics analysis in <italic>S. superba</italic> (<xref ref-type="bibr" rid="B30">Workman et al., 2018</xref>; <xref ref-type="bibr" rid="B36">Zuo et al., 2018</xref>).</p>
<p>In past years, PacBio platform was used to sequence the full-length transcriptional group of tea (<italic>Camellia sinensis</italic>) (<xref ref-type="bibr" rid="B21">Qiao et al., 2019</xref>). Finally, 213,389 polished consensus sequences were obtained, 223,120 CDS sequences were predicted, 195,062 SSR loci were detected, and 5,785 transcription factors belonging to 60 transcription factor families were predicted. PacBio RS II platform was used to analyze the full-length transcription group of sunflowers, 10.43 Gb clean data were obtained, and 38,302 de-redundant sequences were obtained (<xref ref-type="bibr" rid="B7">Chen et al., 2018</xref>). Previous research on <italic>S. superba</italic> was mainly focused on genetic mapping, gene expression, and proteomic analysis (<xref ref-type="bibr" rid="B6">Chen et al., 2014</xref>; <xref ref-type="bibr" rid="B34">Zhang et al., 2019</xref>, <xref ref-type="bibr" rid="B33">Yang et al., 2021</xref>). However, these techniques could not provide and assembled full-length transcripts. On the other hand, PacBio SMRT single-molecule long-read sequencing revealed a better capacity in capturing transcript sequences, mainly long transcript sequences. The transcriptome sequencing of 18 samples was completed, and a total of 124.45 G of clean data were obtained, with Q30 reaching 85%. These data were corrected by Illumina clean reads, after the integration and quality control of data from the two platforms. After sequencing, 588,479 circular consensus (CCS) reads were obtained, including 511,759 full-length reads non-chimeric (FLNC) sequences. Previous studies showed that the length of the FLNC sequence emulates the length of the cDNA sequence in whole sequence library, whereas the library can be examined by the length of FLNC sequence (<xref ref-type="bibr" rid="B5">Chao et al., 2018</xref>). The full-length non-chimeric sequences were clustered to obtain 167,782 consensus sequences, and 163,834 high-quality consensus sequences were obtained by polishing the consensus sequences. The low-quality consensus sequences were corrected with the second-generation transcriptome data, and they were consistent with high-quality. The sequences were merged and subjected to de-redundancy analysis to obtain 41,112 transcript sequences. Each sample obtained 7,489 alternative splicing, and a total of 113,698 SSR and 78,255 complete CDS regions were obtained. Previous studies showed variations in the percentage of tetra, penta, and hexa nucleotide repeats observed in sorghum (5.4%), rice (2.54%), Populus (1.66%), and Medicago (0.94%) (Ref 4). Our findings of sequence library provide basic information for improving the <italic>S. superba</italic> draft genome annotation and complete characterization of this species transcriptome.</p>
<p>Results of qRT PCR analysis indicated the highest expression of Gene 6 (CAX-interacting protein 4), in Mn-treated group (WT) on day 1, 5, and 10. Our results are similar with the study of <xref ref-type="bibr" rid="B20">Pittman and Hirschi (2016)</xref>. Previous studies indicated that CAX shows high expression under salt stress. Moreover, the higher expression of CAX (Na_Ca_ex) in Mn-treated group (WT) was also observed. The CAX proteins are one of the five transporter families that constitute Ca<sup>2+</sup>/cation antiporters (CaCA) superfamily (<xref ref-type="bibr" rid="B23">Shigaki et al., 2006</xref>; <xref ref-type="bibr" rid="B11">Emery et al., 2012</xref>). Although the CAX family members were at first identified as Ca<sup>2+</sup> transporters, related work revealed their ability to transport a wide array of ions (<xref ref-type="bibr" rid="B20">Pittman and Hirschi, 2016</xref>). In plants, the CAXs mediate efflux of ions present into the vacuole. This study has provided enriched information about expression and regulation of genes in stress conditions of <italic>S. superba</italic>. In addition, this study provided for the first time a full-length transcriptome of the <italic>S. superba</italic> using the SMRT sequencing method. The transcriptome design in this research will assist future research on functional genomics and facilitate support for advance genetic engineering of <italic>S. superba</italic>.</p>
</sec>
<sec id="S6">
<title>Data Availability Statement</title>
<p>Data are available at the SRA portal (<ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/sra/PRJNA679388">https://www.ncbi.nlm.nih.gov/sra/PRJNA679388</ext-link>) of NCBI, accession number: <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA679388">PRJNA679388</ext-link>.</p>
</sec>
<sec id="S7">
<title>Author Contributions</title>
<p>QL designed the experiments and supervised the research work. FL executed the experiments and wrote the manuscript. MM analyzed the results and formatted the manuscript. SA, UH, and JS did data compilation. WZ and SS did analyses and sample collection. SC supervised the research work. All authors read and approved the final manuscript.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</body>
<back>
<fn-group>
<fn fn-type="financial-disclosure">
<p><bold>Funding.</bold> This research is financially supported by Shanghai Sciences and Technology Commission, Project No: 18DZ2283500.</p>
</fn>
</fn-group>
<sec id="S9" sec-type="supplementary material"><title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2021.635043/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2021.635043/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.PDF" id="DS1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 1</label>
<caption><p>Summary of the predicted alternative splicing (AS) events.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Data_Sheet_3.PDF" id="DS2" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 2</label>
<caption><p>Summary of lncRNA predicted by CPC, CNCI, CPAT, and Pfam protein structure domain analysis.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Data_Sheet_6.PDF" id="DS3" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 3</label>
<caption><p>Summary of identified TFs.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Data_Sheet_2.PDF" id="DS4" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 4</label>
<caption><p>Summary of the transcripts annotated to the reference canonical pathways in the KEGG database.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Data_Sheet_4.PDF" id="DS5" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 5</label>
<caption><p>The primers used for qRT-PCR analysis.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Data_Sheet_5.PDF" id="DS6" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 6</label>
<caption><p>The characterization of EST-SSR markers.</p></caption>
</supplementary-material>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bairoch</surname> <given-names>A.</given-names></name> <name><surname>Apweiler</surname> <given-names>R.</given-names></name></person-group> (<year>2000</year>). <article-title>The SWISS-PROT protein sequence database and its supplement TrEMBL in 2000.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>28</volume> <fpage>45</fpage>&#x2013;<lpage>48</lpage>. <pub-id pub-id-type="doi">10.1093/nar/28.1.45</pub-id> <pub-id pub-id-type="pmid">10592178</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Baker</surname> <given-names>A. J.</given-names></name> <name><surname>Brooks</surname> <given-names>R.</given-names></name></person-group> (<year>1989</year>). <article-title>Terrestrial higher plants which hyperaccumulate metallic elements. a review of their distribution, ecology and phytochemistry.</article-title> <source><italic>Biorecovery</italic></source> <volume>12</volume> <fpage>81</fpage>&#x2013;<lpage>126</lpage>.</citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Beier</surname> <given-names>S.</given-names></name> <name><surname>Thiel</surname> <given-names>T.</given-names></name> <name><surname>M&#x00FC;nch</surname> <given-names>T.</given-names></name> <name><surname>Scholz</surname> <given-names>U.</given-names></name> <name><surname>Mascher</surname> <given-names>M.</given-names></name></person-group> (<year>2017</year>). <article-title>MISA-web: a web server for microsatellite prediction.</article-title> <source><italic>Bioinformatics</italic></source> <volume>33</volume> <fpage>2583</fpage>&#x2013;<lpage>2585</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btx198</pub-id> <pub-id pub-id-type="pmid">28398459</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Capuana</surname> <given-names>M.</given-names></name></person-group> (<year>2020</year>). <article-title>A review of the performance of woody and herbaceous ornamental plants for phytoremediation in urban areas.</article-title> <source><italic>IForest</italic></source> <volume>13</volume>:<issue>139</issue>. <pub-id pub-id-type="doi">10.3832/ifor3242-013</pub-id> <pub-id pub-id-type="pmid">17959540</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chao</surname> <given-names>Y.</given-names></name> <name><surname>Yuan</surname> <given-names>J.</given-names></name> <name><surname>Li</surname> <given-names>S.</given-names></name> <name><surname>Jia</surname> <given-names>S.</given-names></name> <name><surname>Han</surname> <given-names>L.</given-names></name> <name><surname>Xu</surname> <given-names>L.</given-names></name></person-group> (<year>2018</year>). <article-title>Analysis of transcripts and splice isoforms in red clover (<italic>Trifolium pratense</italic> L.) by single-molecule long-read sequencing.</article-title> <source><italic>BMC Plant Biol.</italic></source> <volume>18</volume>:<issue>300</issue>. <pub-id pub-id-type="doi">10.1186/s12870-018-1534-8</pub-id> <pub-id pub-id-type="pmid">30477428</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>J.</given-names></name> <name><surname>Hu</surname> <given-names>W. J.</given-names></name> <name><surname>Wang</surname> <given-names>C.</given-names></name> <name><surname>Liu</surname> <given-names>T. W.</given-names></name> <name><surname>Chalifour</surname> <given-names>A.</given-names></name> <name><surname>Shen</surname> <given-names>Z. J.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Proteomic analysis reveals differences in tolerance to acid rain in two broad-leaf tree species, <italic>Liquidambar formosana</italic> and <italic>Schima superba</italic>.</article-title> <source><italic>PLoS One</italic></source> <volume>9</volume>:<issue>e102532</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0102532</pub-id> <pub-id pub-id-type="pmid">25025692</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>J.</given-names></name> <name><surname>Tang</surname> <given-names>X.</given-names></name> <name><surname>Ren</surname> <given-names>C.</given-names></name> <name><surname>Wei</surname> <given-names>B.</given-names></name> <name><surname>Wu</surname> <given-names>Y.</given-names></name> <name><surname>Wu</surname> <given-names>Q.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Full-length transcriptome sequences and the identification of putative genes for flavonoid biosynthesis in safflower.</article-title> <source><italic>BMC Genomics</italic></source> <volume>19</volume>:<issue>548</issue>. <pub-id pub-id-type="doi">10.1186/s12864-018-4946-9</pub-id> <pub-id pub-id-type="pmid">30041604</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dharshini</surname> <given-names>S.</given-names></name> <name><surname>Chakravarthi</surname> <given-names>M.</given-names></name> <name><surname>Manoj</surname> <given-names>V. M.</given-names></name> <name><surname>Naveenarani</surname> <given-names>M.</given-names></name> <name><surname>Kumar</surname> <given-names>R.</given-names></name> <name><surname>Meena</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>De novo sequencing and transcriptome analysis of a low temperature tolerant <italic>Saccharum spontaneum</italic> clone IND 00-1037.</article-title> <source><italic>J. Biotechnol.</italic></source> <volume>231</volume> <fpage>280</fpage>&#x2013;<lpage>294</lpage>. <pub-id pub-id-type="doi">10.1016/j.jbiotec.2016.05.036</pub-id> <pub-id pub-id-type="pmid">27269250</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dong</surname> <given-names>L.</given-names></name> <name><surname>Liu</surname> <given-names>H.</given-names></name> <name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Yang</surname> <given-names>S.</given-names></name> <name><surname>Kong</surname> <given-names>G.</given-names></name> <name><surname>Chu</surname> <given-names>J. S.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Single-molecule real-time transcript sequencing facilitates common wheat genome annotation and grain transcriptome research.</article-title> <source><italic>BMC Genomics</italic></source> <volume>16</volume>:<issue>1039</issue>. <pub-id pub-id-type="doi">10.1186/s12864-015-2257-y</pub-id> <pub-id pub-id-type="pmid">26645802</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dong</surname> <given-names>Z.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name></person-group> (<year>2013</year>). <article-title>Transcriptomics: advances and approaches.</article-title> <source><italic>Sci. China Life Sci.</italic></source> <volume>56</volume> <fpage>960</fpage>&#x2013;<lpage>967</lpage>. <pub-id pub-id-type="doi">10.1007/s11427-013-4557-2</pub-id> <pub-id pub-id-type="pmid">24091688</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Emery</surname> <given-names>L.</given-names></name> <name><surname>Whelan</surname> <given-names>S.</given-names></name> <name><surname>Hirschi</surname> <given-names>K. D.</given-names></name> <name><surname>Pittman</surname> <given-names>J. K.</given-names></name></person-group> (<year>2012</year>). <article-title>Protein phylogenetic analysis of Ca2+/cation antiporters and insights into their evolution in plants.</article-title> <source><italic>Front. Plant Sci.</italic></source> <volume>3</volume>:<issue>1</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2012.00001</pub-id> <pub-id pub-id-type="pmid">22645563</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Finn</surname> <given-names>R. D.</given-names></name> <name><surname>Coggill</surname> <given-names>P.</given-names></name> <name><surname>Eberhardt</surname> <given-names>R. Y.</given-names></name> <name><surname>Eddy</surname> <given-names>S. R.</given-names></name> <name><surname>Mistry</surname> <given-names>J.</given-names></name> <name><surname>Mitchell</surname> <given-names>A. L.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>The Pfam protein families database: towards a more sustainable future.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>44</volume> <fpage>D279</fpage>&#x2013;<lpage>D285</lpage>.</citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jiao</surname> <given-names>W. B.</given-names></name> <name><surname>Schneeberger</surname> <given-names>K.</given-names></name></person-group> (<year>2017</year>). <article-title>The impact of third generation genomic technologies on plant genome assembly.</article-title> <source><italic>Curr. Opin. Plant Biol.</italic></source> <volume>36</volume> <fpage>64</fpage>&#x2013;<lpage>70</lpage>. <pub-id pub-id-type="doi">10.1016/j.pbi.2017.02.002</pub-id> <pub-id pub-id-type="pmid">28231512</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kanehisa</surname> <given-names>M.</given-names></name> <name><surname>Goto</surname> <given-names>S.</given-names></name> <name><surname>Kawashima</surname> <given-names>S.</given-names></name> <name><surname>Okuno</surname> <given-names>Y.</given-names></name> <name><surname>Hattori</surname> <given-names>M.</given-names></name></person-group> (<year>2004</year>). <article-title>The KEGG resource for deciphering the genome.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>32</volume> <fpage>D277</fpage>&#x2013;<lpage>D280</lpage>.</citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kong</surname> <given-names>L.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Ye</surname> <given-names>Z. Q.</given-names></name> <name><surname>Liu</surname> <given-names>X. Q.</given-names></name> <name><surname>Zhao</surname> <given-names>S. Q.</given-names></name> <name><surname>Wei</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>CPC: assess the protein-coding potential of transcripts using sequence features and support vector machine.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>35</volume> <fpage>W345</fpage>&#x2013;<lpage>W349</lpage>.</citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Levy</surname> <given-names>S. E.</given-names></name> <name><surname>Myers</surname> <given-names>R. M.</given-names></name></person-group> (<year>2016</year>). <article-title>Advancements in next-generation sequencing.</article-title> <source><italic>Annu. Rev. Genomics Hum. Genet.</italic></source> <volume>17</volume> <fpage>95</fpage>&#x2013;<lpage>115</lpage>.</citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>W.</given-names></name> <name><surname>Jaroszewski</surname> <given-names>L.</given-names></name> <name><surname>Godzik</surname> <given-names>A.</given-names></name></person-group> (<year>2002</year>). <article-title>Tolerating some redundancy significantly speeds up clustering of large protein databases.</article-title> <source><italic>Bioinformatics</italic></source> <volume>18</volume> <fpage>77</fpage>&#x2013;<lpage>82</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/18.1.77</pub-id> <pub-id pub-id-type="pmid">11836214</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luo</surname> <given-names>C.</given-names></name> <name><surname>Shen</surname> <given-names>Z.</given-names></name> <name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Baker</surname> <given-names>A. J.</given-names></name></person-group> (<year>2006</year>). <article-title>Enhanced phytoextraction of Pb and other metals from artificially contaminated soils through the combined application of EDTA and EDDS.</article-title> <source><italic>Chemosphere</italic></source> <volume>63</volume> <fpage>1773</fpage>&#x2013;<lpage>1784</lpage>. <pub-id pub-id-type="doi">10.1016/j.chemosphere.2005.09.050</pub-id> <pub-id pub-id-type="pmid">16297960</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Padmavathiamma</surname> <given-names>P. K.</given-names></name> <name><surname>Li</surname> <given-names>L. Y.</given-names></name></person-group> (<year>2007</year>). <article-title>Phytoremediation technology: hyper-accumulation metals in plants.</article-title> <source><italic>Water Air Soil Pollut.</italic></source> <volume>184</volume> <fpage>105</fpage>&#x2013;<lpage>126</lpage>. <pub-id pub-id-type="doi">10.1007/s11270-007-9401-5</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pittman</surname> <given-names>J. K.</given-names></name> <name><surname>Hirschi</surname> <given-names>K. D.</given-names></name></person-group> (<year>2016</year>). <article-title>CAX-ing a wide net: cation/H+ transporters in metal remediation and abiotic stress signalling.</article-title> <source><italic>Plant Biol.</italic></source> <volume>18</volume> <fpage>741</fpage>&#x2013;<lpage>749</lpage>. <pub-id pub-id-type="doi">10.1111/plb.12460</pub-id> <pub-id pub-id-type="pmid">27061644</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Qiao</surname> <given-names>D.</given-names></name> <name><surname>Yang</surname> <given-names>C.</given-names></name> <name><surname>Chen</surname> <given-names>J.</given-names></name> <name><surname>Guo</surname> <given-names>Y.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Niu</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Comprehensive identification of the full-length transcripts and alternative splicing related to the secondary metabolism pathways in the tea plant (<italic>Camellia sinensis</italic>).</article-title> <source><italic>Sci. Rep.</italic></source> <volume>9</volume>:<issue>2709</issue>.</citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rhoads</surname> <given-names>A.</given-names></name> <name><surname>Au</surname> <given-names>K. F.</given-names></name></person-group> (<year>2015</year>). <article-title>PacBio sequencing and its applications.</article-title> <source><italic>Genomics Proteomics Bioinformatics</italic></source> <volume>13</volume> <fpage>278</fpage>&#x2013;<lpage>289</lpage>. <pub-id pub-id-type="doi">10.1016/j.gpb.2015.08.002</pub-id> <pub-id pub-id-type="pmid">26542840</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shigaki</surname> <given-names>T.</given-names></name> <name><surname>Rees</surname> <given-names>I.</given-names></name> <name><surname>Nakhleh</surname> <given-names>L.</given-names></name> <name><surname>Hirschi</surname> <given-names>K. D.</given-names></name></person-group> (<year>2006</year>). <article-title>Identification of three distinct phylogenetic groups of CAX cation/proton antiporters.</article-title> <source><italic>J. Mol. Evol.</italic></source> <volume>63</volume> <fpage>815</fpage>&#x2013;<lpage>825</lpage>. <pub-id pub-id-type="doi">10.1007/s00239-006-0048-4</pub-id> <pub-id pub-id-type="pmid">17086450</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Slatko</surname> <given-names>B. E.</given-names></name> <name><surname>Gardner</surname> <given-names>A. F.</given-names></name> <name><surname>Ausubel</surname> <given-names>F. M.</given-names></name></person-group> (<year>2018</year>). <article-title>Overview of next-generation sequencing technologies.</article-title> <source><italic>Curr. Protoc. Mol. Biol.</italic></source> <volume>122</volume>:<issue>e59</issue>.</citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>L.</given-names></name> <name><surname>Luo</surname> <given-names>H.</given-names></name> <name><surname>Bu</surname> <given-names>D.</given-names></name> <name><surname>Zhao</surname> <given-names>G.</given-names></name> <name><surname>Yu</surname> <given-names>K.</given-names></name> <name><surname>Zhang</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Utilizing sequence intrinsic composition to classify protein-coding and long non-coding transcripts.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>41</volume>:<issue>e166</issue>. <pub-id pub-id-type="doi">10.1093/nar/gkt646</pub-id> <pub-id pub-id-type="pmid">23892401</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tang</surname> <given-names>C. Q.</given-names></name> <name><surname>Han</surname> <given-names>P. B.</given-names></name> <name><surname>Li</surname> <given-names>S.</given-names></name> <name><surname>Shen</surname> <given-names>L. Q.</given-names></name> <name><surname>Huang</surname> <given-names>D. S.</given-names></name> <name><surname>Li</surname> <given-names>Y. F.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Species richness, forest types and regeneration of Schima in the subtropical forest ecosystem of Yunnan, southwestern China.</article-title> <source><italic>For. Ecosyst.</italic></source> <volume>7</volume> <fpage>1</fpage>&#x2013;<lpage>19</lpage>.</citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tatusov</surname> <given-names>R. L.</given-names></name> <name><surname>Fedorova</surname> <given-names>N. D.</given-names></name> <name><surname>Jackson</surname> <given-names>J. D.</given-names></name> <name><surname>Jacobs</surname> <given-names>A. R.</given-names></name> <name><surname>Kiryutin</surname> <given-names>B.</given-names></name> <name><surname>Koonin</surname> <given-names>E. V.</given-names></name><etal/></person-group> (<year>2003</year>). <article-title>The COG database: an updated version includes eukaryotes.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>4</volume>:<issue>41</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-4-41</pub-id> <pub-id pub-id-type="pmid">12969510</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>J.</given-names></name> <name><surname>Cheng</surname> <given-names>J.</given-names></name> <name><surname>Xu</surname> <given-names>D.</given-names></name> <name><surname>Jiang</surname> <given-names>L.</given-names></name></person-group> (<year>2015</year>). <article-title>Genetic interactions between the Golgi Ca<sup>2 + </sup>/H<sup>+</sup> exchanger Gdt1 and the plasma membrane calcium channel Cch1/Mid1 in the regulation of calcium homeostasis, stress response and virulence in Candida albicans.</article-title> <source><italic>FEMS Yeast Res.</italic></source> <volume>15</volume>:<issue>fov069</issue>. <pub-id pub-id-type="doi">10.1093/femsyr/fov069</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Workman</surname> <given-names>R. E.</given-names></name> <name><surname>Myrka</surname> <given-names>A. M.</given-names></name> <name><surname>Wong</surname> <given-names>G. W.</given-names></name> <name><surname>Tseng</surname> <given-names>E.</given-names></name> <name><surname>Welch</surname> <given-names>K. C.</given-names> <suffix>Jr.</suffix></name> <name><surname>Timp</surname> <given-names>W.</given-names></name></person-group> (<year>2018</year>). <article-title>Single-molecule, full-length transcript sequencing provides insight into the extreme metabolism of the ruby-throated hummingbird <italic>Archilochus colubris</italic>.</article-title> <source><italic>GigaScience</italic></source> <volume>7</volume> <issue>giy009</issue>.</citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xie</surname> <given-names>J.</given-names></name> <name><surname>Zuo</surname> <given-names>J.</given-names></name> <name><surname>Huang</surname> <given-names>Y.</given-names></name> <name><surname>Li</surname> <given-names>C.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name></person-group> (<year>2020</year>). <article-title>The origin and germplasm collection for cultivated <italic>Dendrobium</italic> officinale K. Kimura &#x0026; Migo individuals revealed by EST-SSR markers.</article-title> <source><italic>Genet. Resour. Crop Evol.</italic></source> <volume>67</volume> <fpage>1209</fpage>&#x2013;<lpage>1219</lpage>. <pub-id pub-id-type="doi">10.1007/s10722-020-00906-7</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>S. X.</given-names></name> <name><surname>Deng</surname> <given-names>H.</given-names></name> <name><surname>Li</surname> <given-names>M. S.</given-names></name></person-group> (<year>2008</year>). <article-title>Manganese uptake and accumulation in a woody hyperaccumulator <italic>Schima superba</italic>.</article-title> <source><italic>Plant Soil Environ.</italic></source> <volume>54</volume> <fpage>441</fpage>&#x2013;<lpage>446</lpage>. <pub-id pub-id-type="doi">10.17221/401-pse</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>Z.</given-names></name> <name><surname>Zhang</surname> <given-names>R.</given-names></name> <name><surname>Zhou</surname> <given-names>Z.</given-names></name></person-group> (<year>2021</year>). <source><italic>Selection and Validation of Appropriate Reference Genes for Gene Expression Studies in Schima Superba.</italic></source></citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>R.</given-names></name> <name><surname>Yang</surname> <given-names>H.</given-names></name> <name><surname>Zhou</surname> <given-names>Z.</given-names></name> <name><surname>Shen</surname> <given-names>B.</given-names></name> <name><surname>Xiao</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>B.</given-names></name></person-group> (<year>2019</year>). <article-title>A high-density genetic map of <italic>Schima superba</italic> based on its chromosomal characteristics.</article-title> <source><italic>BMC Plant Biol.</italic></source> <volume>19</volume>:<issue>41</issue>. <pub-id pub-id-type="doi">10.1186/s12870-019-1655-8</pub-id> <pub-id pub-id-type="pmid">30683049</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zheng</surname> <given-names>Y.</given-names></name> <name><surname>Jiao</surname> <given-names>C.</given-names></name> <name><surname>Sun</surname> <given-names>H.</given-names></name> <name><surname>Rosli</surname> <given-names>H. G.</given-names></name> <name><surname>Pombo</surname> <given-names>M. A.</given-names></name> <name><surname>Zhang</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>iTAK: a program for genome-wide prediction and classification of plant transcription factors, transcriptional regulators, and protein kinases.</article-title> <source><italic>Mol. Plant</italic></source> <volume>9</volume> <fpage>1667</fpage>&#x2013;<lpage>1670</lpage>.</citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zuo</surname> <given-names>C.</given-names></name> <name><surname>Blow</surname> <given-names>M.</given-names></name> <name><surname>Sreedasyam</surname> <given-names>A.</given-names></name> <name><surname>Kuo</surname> <given-names>R. C.</given-names></name> <name><surname>Ramamoorthy</surname> <given-names>G. K.</given-names></name> <name><surname>Torres-Jerez</surname> <given-names>I.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Revealing the transcriptomic complexity of switchgrass by PacBio long-read sequencing.</article-title> <source><italic>Biotechnol. Biofuels</italic></source> <volume>11</volume>:<issue>170</issue>.</citation></ref>
</ref-list>
<fn-group>
<fn id="footnote1">
<label>1</label>
<p><ext-link ext-link-type="uri" xlink:href="http://pgrc.ipk-gatersleben.de/misa/">http://pgrc.ipk-gatersleben.de/misa/</ext-link></p></fn>
<fn id="footnote2">
<label>2</label>
<p><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/COG">http://www.ncbi.nlm.nih.gov/COG</ext-link></p></fn>
</fn-group>
</back>
</article>