<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">749340</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2021.749340</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>A Comparative Transcriptional Landscape of Two Castor Cultivars Obtained by Single-Molecule Sequencing Comparative Analysis</article-title>
<alt-title alt-title-type="left-running-head">Zhou et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">Comparative Transcriptional Landscape of Castor</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Zhou</surname>
<given-names>Yaxing</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1510727/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhu</surname>
<given-names>Guoli</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1510836/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Yun</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1510852/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>He</surname>
<given-names>Zhibiao</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1510860/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Zhou</surname>
<given-names>Wei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1422537/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<label>
<sup>1</sup>
</label>Agricultural College of Inner Mongolia Minzu University, <addr-line>Tongliao</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<label>
<sup>2</sup>
</label>Tongliao Academy of Agricultural Science, <addr-line>Tongliao</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/37384/overview">Wei Xu</ext-link>, Texas A&#x26;M University Corpus Christi, United&#x20;States</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/218953/overview">Katarzyna Agata Knop</ext-link>, University of Dundee, United&#x20;Kingdom</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/55589/overview">Milind B. Ratnaparkhe</ext-link>, ICAR Indian Institute of Soybean Research, India</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Wei Zhou, <email>ycyz958@yeah.net</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Genomic Assay Technology, a section of the journal Frontiers in Genetics</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>18</day>
<month>10</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>12</volume>
<elocation-id>749340</elocation-id>
<history>
<date date-type="received">
<day>29</day>
<month>07</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>30</day>
<month>09</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2021 Zhou, Zhu, Wang, He and Zhou.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Zhou, Zhu, Wang, He and Zhou</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<abstract>
<p>
<bold>Background and Objectives:</bold> Castor (<italic>Ricinus communis</italic> L.) is an important non-edible oilseed crop. Lm-type female strains and normal amphiprotic strains are important castor cultivars, and are mainly different in their inflorescence structures and leaf shapes. To better understand the mechanisms underlying these differences at the molecular level, we performed a comparative transcriptional analysis.</p>
<p>
<bold>Materials and Methods:</bold> Full-length transcriptome sequencing and short-read RNA sequencing were employed.</p>
<p>
<bold>Results:</bold> A total of 76,068 and 44,223&#x20;non-redundant transcripts were obtained from high-quality transcripts of Lm-type female strains and normal amphiprotic strains, respectively. In Lm-type female strains and normal amphiprotic strains, 51,613 and 20,152 alternative splicing events were found, respectively. There were 13,239 transcription factors identified from the full-length transcriptomes. Comparative analysis showed a great variety of gene expression of common and unique transcription factors between the two cultivars. Meanwhile, a functional analysis of the isoforms was conducted. The full-length sequences were used as a reference genome, and a short-read RNA sequencing analysis was performed to conduct differential gene analysis. Furthermore, the function of DEGs were performed to annotation analysis.</p>
<p>
<bold>Conclusion:</bold> The results revealed considerable differences and expression diversity between the two cultivars, well beyond what was reported in previous studies and likely reflecting the differences in architecture between these two cultivars.</p>
</abstract>
<kwd-group>
<kwd>Lm type female strains</kwd>
<kwd>normal amphiprotic strains</kwd>
<kwd>pacbio</kwd>
<kwd>comparative transcriptome</kwd>
<kwd>isoform</kwd>
<kwd>full-length transcriptome</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>The castor plant (<italic>Ricinus communis</italic> L.), which originated in Africa, is an annual or perennial dicotyledonous. High ricinoleic acid content (80&#x2013;90%) and high fatty acid content (more than 45%) in its seed oil make it one of the most important non-edible oilseed crops, and this has attracted much attention from chemists, biologists, and medical scientists (<xref ref-type="bibr" rid="B5">Fan et&#x20;al., 2019</xref>). The inflorescence of common castor plants is gradient monoecious raceme, with male flowers on the lower portion and female flowers at the apex (<xref ref-type="bibr" rid="B21">Tan et&#x20;al., 2015</xref>). Pistillate (bearing only female flowers) variations are bred to improve the seed yield. The Lm type castor is such a variety, obtained by exposing castor seeds to <sup>60</sup>Co&#x3b3;.</p>
<p>With the development of sequencing technology, next-generation sequencing (NGS) has become an essential method for the study of genomes, epigenomes, and transcriptomes (<xref ref-type="bibr" rid="B5">Fan et&#x20;al., 2019</xref>). The NGS method has been used in many model and non-model plant species, and large-scale genome sequences and transcriptome data have been produced for deep analysis (<xref ref-type="bibr" rid="B5">Fan et&#x20;al., 2019</xref>). However, the deficiencies of NGS, such as short reads, result in incompletely assembled transcripts that limit the better understanding of the transcriptomic data (<xref ref-type="bibr" rid="B5">Fan et&#x20;al., 2019</xref>). The PacBio platform is based on the single-molecule real-time (SMRT) sequencing technology and provides longer and full-length transcripts without assembly, and can provide better information to understand the full-length transcriptome, such as alternative splicing, fusion transcripts, alternative polyadenylation, novel genes, and non-coding RNAs (<xref ref-type="bibr" rid="B5">Fan et&#x20;al., 2019</xref>).</p>
<p>To gain an insight into how sex is differentially regulated at the molecular level, in the present study, full-length transcriptomes of Lm-type and normal castor cultivars were analyzed, and short-read RNA sequencing and single-molecule long-read sequencing were utilized to identify the differentially expressed genes and alternative splicing events between Lm-type female strains and normal amphiprotic strains. Furthermore, the study will provide valuable data for future studies of sex determination on castor plants.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>Materials and Methods</title>
<p>Two cultivars, Lm-type female plants with willow-shaped leaves and normal amphiprotic plants (<xref ref-type="fig" rid="F1">Figure&#x20;1</xref>), were grown at the Experimental Base of the Agricultural College of INNER MONGOLIA MINZU UNIVERSITY, Tongliao City, Inner Mongolia Autonomous Region. The geographical position is between 42&#xb0;15&#x2032;-45&#xb0;41&#x2032; north latitude and 119&#xb0;15&#x2032;-123&#xb0;43&#x2032; east longitude. Ten plants of each cultivar were selected when the functional leaves grew to 1&#x2013;6&#xa0;cm (Lm-type) or 2&#x2013;15&#xa0;cm (normal type) on August 2nd, 2018. The Lm-type female plants and normal amphiprotic plants were designated as F01 and F02, respectively. For each cultivar around 10g of leaves and flowers were collected and frozen in liquid nitrogen and then stored at &#x2212;80&#xb0;C for subsequent RNA isolation. Using the Illumina HiSeq X Ten platform, RNA was extracted from 5g of frozen leaves or flowers with two repeats, and an RNA-Seq library construction was performed following the instructions (<xref ref-type="bibr" rid="B14">Podnar et&#x20;al., 2014</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>The castor plant R. communis L. <bold>(A)</bold> Lm-type female strains with willow-shaped leaves. <bold>(B)</bold> Normal amphiprotic strains.</p>
</caption>
<graphic xlink:href="fgene-12-749340-g001.tif"/>
</fig>
<sec id="s2-1">
<title>PacBio Library Construction and Sequencing</title>
<p>The total RNA was extracted from 5g mixtures of leaves and flowers (two repeats). Poly(T) oligo-attached magnetic beads (Dynal) were used to purify mRNA from about 3&#xa0;&#xb5;g total RNA. According to the protocols of the PacBio RS II platform, cDNA was synthesized using the SMART PCR cDNA Synthesis Kit (Clontech, CA, United&#x20;States), and then fractionated with BluePippin<sup>&#xae;</sup> (Sage Science, Beverly, MA, United&#x20;States). Then the final libraries were constructed using the Pacific Biosciences DNA Template Prep Kit (version 2.0). SMRT sequencing was performed with the Pacific Biosciences&#x2019; real-time sequencer using C2 sequencing reagents.</p>
</sec>
<sec id="s2-2">
<title>Preprocessing of SMRT Reads</title>
<p>The subreads were filtered using the standard protocol of the SMRT Analysis software suite (<ext-link ext-link-type="uri" xlink:href="http://www.pacificbiosciences.com">http://www.pacificbiosciences.com</ext-link>), and the reads of insert (ROIs) were obtained. After examining the poly(A) signals and 5&#x2032; and 3&#x2019; adaptors, full-length (FL) and non-full-length (nFL) reads were identified.</p>
<p>Consensus sequences were obtained from high-quality isoform sequences. The final transcriptome isoform sequences were filtered by removing the redundant sequences with the CD-HIT package (<ext-link ext-link-type="uri" xlink:href="http://weizhong-lab.ucsd.edu/cdhit_suite/cgi-bin/index.cgi?cmd=cd-hit">http://weizhong-lab.ucsd.edu/cdhit_suite/cgi-bin/index.cgi?cmd&#x3d;cd-hit</ext-link>) to cluster and compare protein or nucleotide sequences.</p>
</sec>
<sec id="s2-3">
<title>Alternative Splicing Analysis of Transcriptomes</title>
<p>To identify alternative splicing (AS) events, SpliceGrapher (<xref ref-type="bibr" rid="B16">Rogers et&#x20;al., 2012</xref>) was used to analyze the transcriptome-wide AS events. AS events were predicted from non-redundant transcripts. The prediction criterion is as following: the sequence should be greater than 1,000&#xa0;bp, the AS gap should be greater than 100&#xa0;bp and at least 100&#xa0;bp from the 3&#x27;-/5&#x27;-end, and there should be a 5-bp overlap in the spliced transcript. Compared with the reference castor genome (<ext-link ext-link-type="uri" xlink:href="http://castorbean.jcvi.org/">http://castorbean.jcvi.org/</ext-link>), the full-length transcripts can be classified as derivations from the known genes and novel genetic&#x20;loci.</p>
<p>Candidate coding regions were identified by TransDecoder (Broad Institute, Cambridge, MA, United&#x20;States) from the final transcriptome isoform sequence. Sequences were searched using BLASTX (<xref ref-type="bibr" rid="B2">Buchfink et&#x20;al., 2015</xref>) against the NCBI non-redundant protein and the UniProt with E-value cutoff at 1&#x20;&#xd7; 10<sup>&#x2212;6</sup>. To further distinguish protein-coding and non-coding RNAs, the dbHT-Trans tool (v1.0) (<xref ref-type="bibr" rid="B4">Deng and Chen 2016</xref>) was used for all PacBio transcripts.</p>
<p>The gene ontology (GO) enrichments were analyzed using the GOseq (<xref ref-type="bibr" rid="B25">Young et&#x20;al., 2010</xref>). The KEGG (<ext-link ext-link-type="uri" xlink:href="http://www.genome.jp/kegg/">http://www.genome.jp/kegg/</ext-link>) pathway analysis was implemented as reported (<xref ref-type="bibr" rid="B9">Kanehisa et&#x20;al., 2017</xref>).</p>
</sec>
<sec id="s2-4">
<title>Short-Read RNA Sequencing Analysis and Quantification of Gene Expression</title>
<p>The clean reads were screened from raw sequencing reads by removing low-quality reads and reads containing adaptors or ploy-Ns. Sequences of clean reads were aligned to the full-length sequences. Differential expression analysis was performed with EBSeq package (<xref ref-type="bibr" rid="B11">Leng et&#x20;al., 2013</xref>), with FDR &#x3c;0.05 and &#x7c;log2 (fold-change) &#x7c; &#x2265;1.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec id="s3-1">
<title>PacBio Iso-Seq Sequencing</title>
<p>The SMRT sequencing generated 456,994 polymerase reads in total, and 26.25&#xa0;Gb and 16.38&#xa0;Gb clean reads were obtained from Lm-type female and normal castor cultivars, respectively. Under the conditions of full passes of &#x2265;0 and quality of &#x3e;0.80, 647,205 and 328,497 ROIs were obtained from two cultivars, respectively (<xref ref-type="sec" rid="s10">Supplementary Table S1</xref>). In addition, 448,217 and 258,645&#x20;full-length non-chimeric sequences were identified from Lm-type and normal castors, respectively (<xref ref-type="sec" rid="s10">Supplementary Table&#x20;S2</xref>).</p>
<p>The SMRT sequencing generated 456,994 polymerase reads in total, and 26.25&#xa0;Gb and 16.38&#xa0;Gb of clean reads were obtained from Lm-type female and normal castor cultivars, respectively. Under the conditions of full passes of &#x2265;0 and quality of &#x3e;0.80, 647,205 and 328,497 ROIs were obtained from two cultivars, respectively (<xref ref-type="sec" rid="s10">Supplementary Table S1</xref>). In addition, 448,217 and 258,645&#x20;full-length non-chimeric sequences were identified from Lm-type and normal castors, respectively (<xref ref-type="sec" rid="s10">Supplementary Table&#x20;S2</xref>).</p>
<p>The lengths of full-length cDNA in the Lm-type female strain ranged from 281 to 11,430&#xa0;bp with an average length of 2,702&#xa0;bp. For the normal castor strain, the full-length cDNA showed an average length of 2,192&#xa0;bp, and ranged from 303 to 9,681&#xa0;bp. The N50 values of that cDNA were 3,093 and 2,408&#xa0;bp in Lm-type and normal castor cultivars, respectively. Then, from 223,929 (Lm-type female cultivar) and 138,066 (normal castor) full-length consensuses cDNA, 76,068 out of 154,517 (49%) and 44,223 out of 105,536 (42%) high quality full-length consensuses were obtained, respectively. The ICE clustering results are shown in <xref ref-type="table" rid="T1">Table&#x20;1</xref>.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>The statistic results of ICE clustering.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Samples</th>
<th align="center">Number of consensus isoforms</th>
<th align="center">Average consensus isoforms read length</th>
<th align="center">Number of polished high-quality isoforms</th>
<th align="center">Number of polished low-quality isoforms</th>
<th align="center">Percent of polished high-quality isoforms (%)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">F01</td>
<td align="center">223,929</td>
<td align="center">2,552</td>
<td align="center">154,517</td>
<td align="center">68,417</td>
<td align="char" char=".">69.00</td>
</tr>
<tr>
<td align="left">F02</td>
<td align="center">138,066</td>
<td align="center">2,056</td>
<td align="center">105,536</td>
<td align="center">32,086</td>
<td align="char" char=".">76.44</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-2">
<title>Alternative Splicing and Polyadenylation</title>
<p>A total of 51,613 and 20,152 AS events were found in Lm-type and normal castor cultivars, respectively, including exon skipping (ES), intron retention (IR), alternative 3&#x2032; sites (Alt. 3&#x2032;), alternative 5&#x2032; sites (Alt. 5&#x2019;), and mutually exclusive exons. The results showed that intron retention (IR) was the foremost AS event, with 62.14% and 55.94% in Lm-type and normal castor cultivars, respectively. The results of statistical analysis of different AS events in Lm-type female strain and normal castor were showed in <xref ref-type="fig" rid="F2">Figure&#x20;2</xref> and <xref ref-type="sec" rid="s10">Supplementary Table&#x20;S3</xref>.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>The statistics of different AS events of two cultivars. <bold>(A)</bold> AS events of Lm-type female strain. <bold>(B)</bold> AS events of normal castor.</p>
</caption>
<graphic xlink:href="fgene-12-749340-g002.tif"/>
</fig>
</sec>
<sec id="s3-3">
<title>Comparative Analysis of LncRNA and Transcription Factors</title>
<p>Transcription factors which need to specifically bind to certain genes are essential for the regulation of gene expression. A total of 13,239 encoded transcription factors were identified from the full-length transcriptome in the two cultivars. Furthermore, we performed a comparative analysis of the common and unique transcription factors in the two cultivars. The main transcription factor types in Lm-type female castor include Rlk-Pelle-Dlsv, C3H, SNF2, and MYB-related families. In normal castor, the dominant transcription factors were Rlk-pelle-dlsv, camk-camkl-chk1, and MYB-related bHLH types. Although the two cultivars shared some types of transcription factors, the expression of corresponding genes was completely different (<xref ref-type="fig" rid="F3">Figure&#x20;3</xref>).</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Statistics of transcription factors of two cultivars. <bold>(A)</bold> The number of transcription factors only in F01. <bold>(B)</bold> The number of transcription factors only in F01. <bold>(C)</bold> The number of transcription factors common in F01 and F02.</p>
</caption>
<graphic xlink:href="fgene-12-749340-g003.tif"/>
</fig>
<p>As the key regulators in biological processes, long non-coding RNA (LncRNA) is a type of RNA that does not encode proteins (<xref ref-type="bibr" rid="B8">Jathar et&#x20;al., 2017</xref>). A total of 858 lncRNAs were found in the two cultivars using CPC, CNCI, CPAT, and PFAM software (<xref ref-type="bibr" rid="B6">Gong et&#x20;al., 2017</xref>). The genomic distributions of LncRNAs were classified into four types, namely lincRNA, antisense-lncRNA, intronic-lncRNA, and sense_lncRNA. The ratios of different types varied greatly, with 285 lincRNA, 58&#x20;antisense-lncRNA, 7&#x20;intronic-lncRNA, and 166 sense_lncRNA in the Lm-type, and 60, 22, 3, and 49 in the normal castor cultivar, respectively (<xref ref-type="fig" rid="F4">Figure&#x20;4</xref>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Statistics of LncRNA in two cultivars. <bold>(A)</bold> Venn diagram of LncRNAs using CPC, CNCI, CPAT, and PFAM software. <bold>(B)</bold> Statistics of LncRNA types in genomic distributions. <bold>(C)</bold> Statistics of LncRNA types only in F01. <bold>(D)</bold> Statistics of LncRNA types only in F02. <bold>(E)</bold> Statistics of LncRNA types common in F01 and F02.</p>
</caption>
<graphic xlink:href="fgene-12-749340-g004.tif"/>
</fig>
</sec>
<sec id="s3-4">
<title>Functional Annotation and Analysis of Isoform</title>
<p>For the functional annotation of gene isoforms, these genes were searched against the Genbank NR, Swissprot, GO, COG, KOG, Pfam, and KEGG databases, and a total of 85,322 genes were annotated by those seven databases. Among them, 85,286 genes (99.96%) were aligned to the NR, and 62,336 genes were matched to the SWISS-PROT (<xref ref-type="table" rid="T2">Table&#x20;2</xref>). Approximately 79.21% of genes were aligned to <italic>R. communis</italic>, followed by <italic>Jatropha curcas</italic> (8.27%) (<xref ref-type="fig" rid="F5">Figure&#x20;5A</xref>).</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Statistics of annotations for genes of castor.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Anno database</th>
<th align="center">Annotated number</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">COG Annotation</td>
<td align="center">35,743</td>
</tr>
<tr>
<td align="left">GO Annotation</td>
<td align="center">61,390</td>
</tr>
<tr>
<td align="left">KEGG Annotation</td>
<td align="center">39,598</td>
</tr>
<tr>
<td align="left">KOG Annotation</td>
<td align="center">57,228</td>
</tr>
<tr>
<td align="left">Pfam Annotation</td>
<td align="center">63,089</td>
</tr>
<tr>
<td align="left">Swissprot Annotation</td>
<td align="center">62,336</td>
</tr>
<tr>
<td align="left">eggNOG Annotation</td>
<td align="center">83,826</td>
</tr>
<tr>
<td align="left">Nr Annotation</td>
<td align="center">85,286</td>
</tr>
<tr>
<td align="left">All Annotated</td>
<td align="center">85,322</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Statistics of the gene annotation in castor R. communis. <bold>(A)</bold> Nr homologous species distribution statistics. <bold>(B)</bold> GO annotation classification statistics. <bold>(C)</bold> COG annotation classification statistics.</p>
</caption>
<graphic xlink:href="fgene-12-749340-g005.tif"/>
</fig>
<p>The GO annotation system is a directed acyclic graph, including three categories: biological process (BP), molecular function (MF), and cellular component (CC). In this study, GO analysis was conducted using Blast2GO, and detailed GO distributions in GO categories are shown in <xref ref-type="fig" rid="F5">Figure&#x20;5B</xref>. The vast majority of the genes were in cells or cell parts in the cellular component. In the molecular function class, most of the genes were classified as catalytic activity and binding. In the biological process class, genes classified as metabolic processes and cellular processes were the most common. &#x201c;COG&#x201d; refers to clusters of orthologous groups for eukaryotic complete genomes, and every protein in the database is assumed to be evolved from a common ancestor protein. In total, 35,743 out of 85,286 genes were classified into 25 different COG categories (<xref ref-type="fig" rid="F5">Figure&#x20;5C</xref>), and the genes with general functions were the largest category, followed by replication, recombination and repair, and transcription.</p>
<p>The KEGG database is used to determine whether the genes are involved in specific metabolic or signal transduction pathways. In this study, a total of 125 KEGG pathways were identified. Several enriched pathways were involved in plant hormone signal transduction (ko04075), starch and sucrose metabolism (ko00500), and protein processing in the endoplasmic reticulum (ko04141) (<xref ref-type="sec" rid="s10">Supplementary list&#x20;S1</xref>).</p>
</sec>
<sec id="s3-5">
<title>Functional Comparative Analysis of Isoform</title>
<p>For further annotation analysis of gene functionality, the functions of specific and common isoforms in the two samples were analyzed systematically, indicating that although many of the isoforms in the two samples were different, the corresponding gene functions were similar. The GO analysis showed that many of the isoforms enriched in the following items: metabolic process, cellular single-organism, cell part, catalytic activity, and binding (<xref ref-type="fig" rid="F6">Figure&#x20;6</xref>).</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Statistics of the GO classification in two cultivars. <bold>(A)</bold> GO annotation classification statistics common in F01 and F02. <bold>(B)</bold> GO annotation classification statistics only in F01. <bold>(C)</bold> GO annotation classification statistics only in F02.</p>
</caption>
<graphic xlink:href="fgene-12-749340-g006.tif"/>
</fig>
<p>The results of the COG functional annotation analysis on the specific and common isoforms in Lm-type and normal castors were similar to that of the GO analysis, and the function of the isoforms remained consistent. The COG analysis indicated the most common gene functions in L (replication, recombination and repair) and R (general function prediction) (<xref ref-type="fig" rid="F7">Figure&#x20;7</xref>).</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Statistics of the COG classification in two cultivars. <bold>(A)</bold> COG annotation classification statistics common in F01 and F02. <bold>(B)</bold> COG annotation classification statistics only in F01. <bold>(C)</bold> COG annotation classification statistics only in F02.</p>
</caption>
<graphic xlink:href="fgene-12-749340-g007.tif"/>
</fig>
</sec>
<sec id="s3-6">
<title>Genes Associated With Sex Expression and Reproduction in Castor</title>
<p>According to previous studies of sex determination between the monoecious and female <italic>R. communis</italic>, several subgroups genes were assumed to be putatively related to sex determination, such as auxin response factor, dynamin-2A, PCI domain containing protein, Xaa-Pro amino peptidase, ATP-binding protein, set domain protein, spermidine synthase, arginine/serine-rich splicing factor, eukaryotic translation initiation factor 2c, DNA (cytosine-5)-methyltransferase, s-adenosyl-methyltransferase, and acid phosphatase. In this study, many of these subgroups were identified in novel unigenes (<xref ref-type="table" rid="T3">Table&#x20;3</xref>). These genes were associated with hormone stimulus and participate in hormone-mediated signaling pathways, and also play a role in tissue and organ developmental processes.</p>
<table-wrap id="T3" position="float">
<label>TABLE3</label>
<caption>
<p>Putative genes involved in sex determination of R. communis.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Gene name</th>
<th align="center">Numbers in novel unigenes</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Dynamin-2A</td>
<td align="char" char=".">17</td>
</tr>
<tr>
<td align="left">Auxin response factor</td>
<td align="char" char=".">232</td>
</tr>
<tr>
<td align="left">ATP-binding protein</td>
<td align="char" char=".">3</td>
</tr>
<tr>
<td align="left">Spermidine synthase</td>
<td align="char" char=".">20</td>
</tr>
<tr>
<td align="left">Arginine/serine-rich splicing factor</td>
<td align="char" char=".">72</td>
</tr>
<tr>
<td align="left">Acid phosphatase</td>
<td align="char" char=".">123</td>
</tr>
<tr>
<td align="left">Eukaryotic translation initiation factor 2c</td>
<td align="char" char=".">124</td>
</tr>
<tr>
<td align="left">Set domain protein</td>
<td align="char" char=".">30</td>
</tr>
<tr>
<td align="left">DNA (cytosine-5)-methyltransferase</td>
<td align="char" char=".">23</td>
</tr>
<tr>
<td align="left">S-adenosyl-methyltransferase</td>
<td align="char" char=".">4</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-7">
<title>Comparative Analysis of Differential Gene Expression Profiling</title>
<p>The full-length sequences were used as a reference genome, and the sequences from the short-read RNA sequencing were used to conduct a differential gene analysis. A total of 2,461 genes were found to be differentially expressed, with 655&#x20;up-regulated and 1806&#x20;down-regulated. These differentially expressed genes (both up-regulated genes and down-regulated genes) were classified according to their KEGG pathway (<xref ref-type="fig" rid="F8">Figure&#x20;8</xref>). The results showed that up-regulated genes were classified as pathways of ribisome, carbon metabolism, pentose phosphate pathway, and biosynthesis of amino acids. The down-regulated genes were involved in plant hormone signal transduction, phenylpropanoid biosynthesis, carbon metabolism, and plant-pathogen interaction.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Statistics of DEGs and corresponding function in two cultivars. <bold>(A)</bold> Volcano plot of DEGs. The green dots represent down-regulated DEGs, the red dots represent up-regulated DEGs, and the black dots represent non-differentially expressed genes. <bold>(B)</bold> KEGG classification of up-regulated DEGs. <bold>(C)</bold> KEGG classification of down-regulated DEGs.</p>
</caption>
<graphic xlink:href="fgene-12-749340-g008.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>Alternative splicing was involved in phenotypic differences of Lm-type and normal castor cultivars.</p>
<p>In recent years, comparative transcriptome analyses have successfully revealed specific genes responsible for C4 photosynthesis in many grasses, including maize and switchgrass (<xref ref-type="bibr" rid="B5">Fan et&#x20;al., 2019</xref>). Furthermore, recent studies of castor transcriptomes are mainly focused on gene expression from short-read RNA sequencing (<xref ref-type="bibr" rid="B18">Sood et&#x20;al., 2014</xref>; <xref ref-type="bibr" rid="B19">Sturtevant et&#x20;al., 2019</xref>) which cannot identify alternative gene splice forms (<xref ref-type="bibr" rid="B5">Fan et&#x20;al., 2019</xref>). The development of full-length sequencing technology provides a span-new approach to study full-length sequences, alterative splicing, gene structures, and APA of RNA (<xref ref-type="bibr" rid="B7">Grabherr et&#x20;al., 2011</xref>; <xref ref-type="bibr" rid="B15">Rhoads and Au 2015</xref>). We thus conducted a comprehensive comparative analysis for two cultivars using this method. In this work, a total of 76,068 and 44,223&#x20;non-redundant transcripts were obtained from the high-quality transcripts of Lm-type female strain and normal castor cultivars, respectively. Among these genes, 51,613 and 20,152 AS events were found in Lm-type female strain and normal castor, respectively, of which intron retention (IR) was the foremost AS event, with 62.14% and 55.94% in the two cultivars, respectively. Its confirmed gene expression and splicing levels may have a significant impact on the morphological and other phenotypic differences between the two cultivars (<xref ref-type="bibr" rid="B22">Wang et&#x20;al., 2018</xref>). The alternative splicing of eukaryotic transcripts is a mechanism that enables cells to generate vast protein diversity from a limited number of genes (<xref ref-type="bibr" rid="B1">Baralle and Giudice 2017</xref>; <xref ref-type="bibr" rid="B3">Bush et&#x20;al., 2017</xref>). The mechanism and outcomes of the alternative splicing of individual transcripts are well understood (<xref ref-type="bibr" rid="B5">Fan et&#x20;al., 2019</xref>). Some studies find that AS regulation is independent or partially independent of transcriptional regulation (<xref ref-type="bibr" rid="B17">Siam et&#x20;al., 2019</xref>) and implements great function at the early stage of the heat response (<xref ref-type="bibr" rid="B10">Keller et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B17">Siam et&#x20;al., 2019</xref>), useful for future heat sensing and signaling studies (<xref ref-type="bibr" rid="B5">Fan et&#x20;al., 2019</xref>). Our new findings about AS provide important information for facilitating castor genome annotation, and the full characterization of the castor transcriptome.</p>
<sec id="s4-1">
<title>Transcription Factors and lncRNAs Played Important Role in Phenotypic Differences of Lm-Type and Normal Castor Cultivars</title>
<p>As the key regulators of transcription, TFs play an important role in the physiological regulation of plants (<xref ref-type="bibr" rid="B13">Olsen et&#x20;al., 2005</xref>; <xref ref-type="bibr" rid="B27">Zhou and Memelink 2016</xref>). Our results (<xref ref-type="fig" rid="F3">Figure&#x20;3</xref>) suggested Rlk-pelle-dlsv, C3H, SNF2, and MYB-related transcription factors were the main types in the Lm-type cultivar. Transcription factors of rlk-pelle-dlsv, camk-camkl-chk1, MYB-related bHLH, and other types were mainly expressed in the normal castor cultivar. We speculate that the difference in TFs has a significant effect on the difference in morphology. Similarly, as the important regulator, the number of lncRNA was very different: there were 285 lincRNA, 58&#x20;antisense-lncRNA, 7&#x20;intronic-lncRNA, and 166 sense_lncRNA in the Lm-type cultivar, while 60, 22, 3, and 49 in the normal castor cultivar, respectively. Emerging work has revealed that many types of lncRNA regulate gene expression and have a great influence on genome stability in plants (<xref ref-type="bibr" rid="B23">Wang and Chekanova 2017</xref>; <xref ref-type="bibr" rid="B20">Sun et&#x20;al., 2018</xref>). Studies on Arabidopsis show that lncRNA can serve as a molecular sponge and as a decoy, functioning in the regulation of transcription and silencing, particularly in RNA-directed DNA methylation, and in epigenetic regulation of flowering time (<xref ref-type="bibr" rid="B26">Zhao et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B12">Liu et&#x20;al., 2019</xref>). Many plants reduce the expression of some lncRNAs to affect developmental phenotypes or molecular changes (<xref ref-type="bibr" rid="B24">Wang et&#x20;al., 2014</xref>). We speculate that these regulators also played an important role in the growth and development of castor, and contribute significantly to phenotypic differences of Lm-type and normal cultivars.</p>
</sec>
<sec id="s4-2">
<title>DEGs Implement a Significant Function in the Morphological Differences of the Two Cultivars</title>
<p>Using the full-length sequences as a reference genome, 2,461 differentially expressed genes were found, including 655&#x20;up-regulated genes and 1806&#x20;down-regulated genes, which was far more than in our previous RNA-seq transcriptome analysis (<xref ref-type="bibr" rid="B5">Fan et&#x20;al., 2019</xref>). In this study, the functional analysis showed that proteins encoded by up-regulated genes (655) were classified to ribisome, carbon metabolism, pentose phosphate pathway, and biosynthesis of amino acids. Proteins encoded by down-regulated genes (1806) were attributed to plant hormone signal transduction, phenyl propanoid biosynthesis, carbon metabolism, and plant-pathogen interaction. We speculate that the differentially expressed genes were the main reason for the differences between the two castors, while the specific regulation mechanisms remain unclear.</p>
</sec>
</sec>
<sec sec-type="conclusion" id="s5">
<title>Conclusion</title>
<p>To the best of our knowledge, this study is the first large-scale comparative analysis of the transcriptome Lm-type and normal castor cultivars by single-molecule long-read sequencing. Comparative analysis of the isoforms, transcription factors, lncRNAs, and AS in the two cultivars was performed systematically. The gene annotation analysis showed that although the isoforms were diverse in the two cultivars, the implemented functions were similar. Many species-specific differences are mainly attributed to small effects at multiple loci, probably. However, differences in the expression of genes and alternative splicing events have a profound effect on the evolution of major morphological diversification for different individuals in the developmental processes. The new findings of this study provided invaluable information for facilitating genome annotation and the full characterization of the transcriptome of these two cultivars.</p>
</sec>
</body>
<back>
<sec id="s6">
<title>Data Availability Statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>, SRR8662424; <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>, SRR8662425.</p>
</sec>
<sec id="s7">
<title>Author Contributions</title>
<p>WZ performed the study, analyzed data, involved in the writing of the manuscript. YZ involved in data analyses, helped in writing the manuscript. GZ involved in sample collection and preparation, and helped in writing the manuscript. YW and ZH helped perform the analysis, and provided constructive discussions. All authors have read and approved the final manuscript.</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ack>
<p>The authors appreciate the great help from GZ of the Tongliao Academy of Agricultural Sciences and ZS of the Shenyang Agricultural University.</p>
</ack>
<sec id="s10">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2021.749340/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2021.749340/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Figure2.JPEG" id="SM1" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Figure5.JPEG" id="SM2" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Figure3.JPEG" id="SM3" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Figure1.JPEG" id="SM4" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Figure4.JPEG" id="SM5" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table7.DOCX" id="SM6" mimetype="application/DOCX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Figure8.JPEG" id="SM7" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table1.DOC" id="SM8" mimetype="application/DOC" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table5.DOCX" id="SM9" mimetype="application/DOCX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Figure7.JPEG" id="SM10" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table3.DOCX" id="SM11" mimetype="application/DOCX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Figure6.JPEG" id="SM12" mimetype="application/JPEG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table6.DOCX" id="SM13" mimetype="application/DOCX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table2.DOC" id="SM14" mimetype="application/DOC" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baralle</surname>
<given-names>F. E.</given-names>
</name>
<name>
<surname>Giudice</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Alternative Splicing as a Regulator of Development and Tissue Identity</article-title>. <source>Nat. Rev. Mol. Cel Biol</source> <volume>18</volume>, <fpage>437</fpage>&#x2013;<lpage>451</lpage>. <pub-id pub-id-type="doi">10.1038/nrm.2017.27</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buchfink</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Huson</surname>
<given-names>D. H.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Fast and Sensitive Protein Alignment Using DIAMOND</article-title>. <source>Nat. Methods</source> <volume>12</volume>, <fpage>59</fpage>&#x2013;<lpage>60</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.3176</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bush</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Tovar-Corona</surname>
<given-names>J.&#x20;M.</given-names>
</name>
<name>
<surname>Urrutia</surname>
<given-names>A. O.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Alternative Splicing and the Evolution of Phenotypic novelty</article-title>, <source>Phil. Trans. R. Soc. B</source>, <volume>372</volume>, <fpage>20150474</fpage>. <pub-id pub-id-type="doi">10.1098/rstb.2015.0474</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Deng</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>S.-Y.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>dbHT-Trans: An Efficient Tool for Filtering the Protein-Encoding Transcripts Assembled by RNA-Seq According to Search for Homologous Proteins</article-title>. <source>J.&#x20;Comput. Biol.</source> <volume>23</volume>, <fpage>1</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1089/cmb.2015.0137</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fan</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Sequencing of Chinese castor Lines Reveals Genetic Signatures of Selection and Yield-Associated Loci</article-title>. <source>Nat. Commun.</source> <volume>10</volume>, <fpage>3418</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-019-11228-3</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gong</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>H.-T.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Trimarchi</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Aifantis</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Tsirigos</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>lncRNA-Screen: an Interactive Platform for Computationally Screening Long Non-coding RNAs in Large Genomics Datasets</article-title>. <source>BMC genomics</source> <volume>18</volume>, <fpage>434</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-017-3817-0</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grabherr</surname>
<given-names>M. G.</given-names>
</name>
<name>
<surname>Haas</surname>
<given-names>B. J.</given-names>
</name>
<name>
<surname>Yassour</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Levin</surname>
<given-names>J.&#x20;Z.</given-names>
</name>
<name>
<surname>Thompson</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Amit</surname>
<given-names>I.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Full-length Transcriptome Assembly from RNA-Seq Data without a Reference Genome</article-title>. <source>Nat. Biotechnol.</source> <volume>29</volume>, <fpage>644</fpage>&#x2013;<lpage>652</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.1883</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jathar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Srivastava</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Tripathi</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2017</year>). <source>Technological Developments in lncRNA Biology</source>. <source>Adv. Exp. Med. Biol.</source> <volume>1008</volume>, <fpage>283</fpage>&#x2013;<lpage>323</lpage>. <pub-id pub-id-type="doi">10.1007/978-981-10-5203-3_10</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kanehisa</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Furumichi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Tanabe</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sato</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Morishima</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>KEGG: New Perspectives on Genomes, Pathways, Diseases and Drugs</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume>, <fpage>D353</fpage>&#x2013;<lpage>d361</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw1092</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Keller</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Mesihovic</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Fragkostefanakis</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Schleiff</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Simm</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Alternative Splicing in Tomato Pollen in Response to Heat Stress</article-title>. <source>DNA Res.</source> <volume>24</volume>, <fpage>dsw051</fpage>&#x2013;<lpage>217</lpage>. <pub-id pub-id-type="doi">10.1093/dnares/dsw051</pub-id> </citation>
</ref>
<ref id="B11">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Leng</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Dawson</surname>
<given-names>J.&#x20;A.</given-names>
</name>
<name>
<surname>Thomson</surname>
<given-names>J.&#x20;A.</given-names>
</name>
<name>
<surname>Ruotti</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Rissman</surname>
<given-names>A. I.</given-names>
</name>
<name>
<surname>Smits</surname>
<given-names>B. M. G.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <source>EBSeq: an Empirical Bayes Hierarchical Model for Inference in RNA-Seq Experiments</source>. <publisher-loc>Oxford, England</publisher-loc>: <publisher-name>Bioinformatics</publisher-name>, <fpage>1035</fpage>&#x2013;<lpage>1043</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btt087</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chang</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Qi</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>The Long Noncoding RNA T5120 Regulates Nitrate Response and Assimilation in Arabidopsis</article-title>. <source>New Phytol.</source> <volume>224</volume>, <fpage>117</fpage>&#x2013;<lpage>131</lpage>. <pub-id pub-id-type="doi">10.1111/nph.16038</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Olsen</surname>
<given-names>A. N.</given-names>
</name>
<name>
<surname>Ernst</surname>
<given-names>H. A.</given-names>
</name>
<name>
<surname>Leggio</surname>
<given-names>L. L.</given-names>
</name>
<name>
<surname>Skriver</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>NAC Transcription Factors: Structurally Distinct, Functionally Diverse</article-title>. <source>Trends Plant Sci.</source> <volume>10</volume>, <fpage>79</fpage>&#x2013;<lpage>87</lpage>. <pub-id pub-id-type="doi">10.1016/j.tplants.2004.12.010</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Podnar</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Deiderick</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Huerta</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Hunicke&#x2010;Smith</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Next&#x2010;Generation Sequencing RNA&#x2010;Seq Library Construction</article-title>. <source>Curr. Protoc. Mol. Biol.</source> <volume>106</volume>, <fpage>4</fpage>&#x2013;<lpage>19</lpage>. <pub-id pub-id-type="doi">10.1002/0471142727.mb0421s106</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rhoads</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Au</surname>
<given-names>K. F.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>PacBio Sequencing and its Applications</article-title>. <source>Genomics, Proteomics &#x26; Bioinformatics</source> <volume>13</volume>, <fpage>278</fpage>&#x2013;<lpage>289</lpage>. <pub-id pub-id-type="doi">10.1016/j.gpb.2015.08.002</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rogers</surname>
<given-names>M. F.</given-names>
</name>
<name>
<surname>Thomas</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Reddy</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Ben-Hur</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>SpliceGrapher: Detecting Patterns of Alternative Splicing from RNA-Seq Data in the Context of Gene Models and EST Data</article-title>. <source>Genome Biol.</source> <volume>13</volume>, <fpage>R4</fpage>. <pub-id pub-id-type="doi">10.1186/gb-2012-13-1-r4</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Siam</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Baker</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Amit</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Regev</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Rabner</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Najar</surname>
<given-names>R. A.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Regulation of Alternative Splicing by P300-Mediated Acetylation of Splicing Factors</article-title>. <source>Rna</source>, <volume>25</volume>, <fpage>813</fpage>&#x2013;<lpage>824</lpage>. <pub-id pub-id-type="doi">10.1261/rna.069856.118</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sood</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Jaiswal</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Chanumolu</surname>
<given-names>S. K.</given-names>
</name>
<name>
<surname>Malhotra</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Pal</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Chauhan</surname>
<given-names>R. S.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Mining Whole Genomes and Transcriptomes of Jatropha (Jatropha Curcas) and Castor Bean (Ricinus communis) for NBS-LRR Genes and Defense Response Associated Transcription Factors</article-title>. <source>Mol. Biol. Rep.</source> <volume>41</volume>, <fpage>7683</fpage>&#x2013;<lpage>7695</lpage>. <pub-id pub-id-type="doi">10.1007/s11033-014-3661-0</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sturtevant</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Romsdahl</surname>
<given-names>T. B.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>X.-H.</given-names>
</name>
<name>
<surname>Burks</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Azad</surname>
<given-names>R. K.</given-names>
</name>
<name>
<surname>Shanklin</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Tissue-specific Differences in Metabolites and Transcripts Contribute to the Heterogeneity of Ricinoleic Acid Accumulation in Ricinus communis L. (castor) Seeds</article-title>. <source>Metabolomics</source> <volume>15</volume>, <fpage>6</fpage>. <pub-id pub-id-type="doi">10.1007/s11306-018-1464-3</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Sui</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Regulation Mechanism of Long Non-coding RNA in Plant Response to Stress</article-title>. <source>Biochem. biophysical Res. Commun.</source> <volume>503</volume>, <fpage>402</fpage>&#x2013;<lpage>407</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbrc.2018.07.072</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Xue</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Transcriptomic Analysis for Different Sex Types of Ricinus communis L. During Development from Apical Buds to Inflorescences by Digital Gene Expression Profiling</article-title>. <source>Front. Plant Sci.</source> <volume>6</volume>, <fpage>1208</fpage>. <pub-id pub-id-type="doi">10.3389/fpls.2015.01208</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Regulski</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Tseng</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Olson</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Goodwin</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>McCombie</surname>
<given-names>W. R.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>A Comparative Transcriptional Landscape of maize and Sorghum Obtained by Single-Molecule Sequencing</article-title>. <source>Genome Res.</source> <volume>28</volume>, <fpage>921</fpage>&#x2013;<lpage>932</lpage>. <pub-id pub-id-type="doi">10.1101/gr.227462.117</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>H.-L. V.</given-names>
</name>
<name>
<surname>Chekanova</surname>
<given-names>J.&#x20;A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Long Noncoding RNAs in Plants</article-title>. <source>Adv. in Exp. Med. Biol.</source> <volume>1008</volume>, <fpage>133</fpage>&#x2013;<lpage>154</lpage>. <pub-id pub-id-type="doi">10.1007/978-981-10-5203-3_5</pub-id> </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>T.-T.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Genomic Features and Regulatory Roles of Intermediate-Sized Non-coding RNAs in Arabidopsis</article-title>. <source>Mol. Plant</source> <volume>7</volume>, <fpage>514</fpage>&#x2013;<lpage>527</lpage>. <pub-id pub-id-type="doi">10.1093/mp/sst177</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Young</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Wakefield</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Smyth</surname>
<given-names>G. K.</given-names>
</name>
<name>
<surname>Oshlack</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Gene Ontology Analysis for RNA-Seq: Accounting for Selection Bias</article-title>. <source>Genome Biol.</source> <volume>11</volume>, <fpage>R14</fpage>. <pub-id pub-id-type="doi">10.1186/gb-2010-11-2-r14</pub-id> </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Lian</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Qi</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Global Identification of Arabidopsis lncRNAs Reveals the Regulation of MAF4 by a Natural Antisense RNA</article-title>. <source>Nat. Commun.</source> <volume>9</volume>, <fpage>5056</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-018-07500-7</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Memelink</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Jasmonate-responsive Transcription Factors Regulating Plant Secondary Metabolism</article-title>. <source>Biotechnol. Adv.</source> <volume>34</volume>, <fpage>441</fpage>&#x2013;<lpage>449</lpage>. <pub-id pub-id-type="doi">10.1016/j.biotechadv.2016.02.004</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>